diff --git a/.gitattributes b/.gitattributes index 98870b57a7ecb3ffaf218590b389ba1bd19be488..ef0da8d342aba2f3cff1bdf74da0098629d4d0fa 100644 --- a/.gitattributes +++ b/.gitattributes @@ -34,3 +34,8 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text wandb/wandb/run-20251002_155442-6v8q0jgn/run-6v8q0jgn.wandb filter=lfs diff=lfs merge=lfs -text +wandb/wandb/run-20251002_151047-gal9lnsm/run-gal9lnsm.wandb filter=lfs diff=lfs merge=lfs -text +wandb/wandb/run-20251002_155441-70dhy5dq/run-70dhy5dq.wandb filter=lfs diff=lfs merge=lfs -text +wandb/wandb/run-20251002_150921-kqbx0cjv/run-kqbx0cjv.wandb filter=lfs diff=lfs merge=lfs -text +cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/run-76mxu43t.wandb filter=lfs diff=lfs merge=lfs -text +wipe_l1_regression/wandb/wandb/run-20251005_163743-a1znetn8/run-a1znetn8.wandb filter=lfs diff=lfs merge=lfs -text diff --git a/all_l1/step8500/config.yaml b/all_l1/step8500/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..405080ae17ead9c64a4104eb1a37b6cd91d9c6bd --- /dev/null +++ b/all_l1/step8500/config.yaml @@ -0,0 +1,322 @@ +run_name: realworld_20250930_131219 +seed: 6198 +epoch: null +dry_run: false +model: + d_model: 3584 + n_heads: 28 + n_kv_heads: 4 + qkv_bias: true + clip_qkv: null + n_layers: 28 + mlp_ratio: 4 + mlp_hidden_size: 37888 + activation_type: swiglu + block_type: sequential + block_group_size: 1 + rope: true + rope_full_precision: true + rope_theta: 1000000.0 + vision_backbone: + image_model_type: openai + image_default_input_size: + - 336 + - 336 + image_patch_size: 14 + image_pos_patch_size: 14 + image_emb_dim: 1024 + image_num_heads: 16 + image_num_key_value_heads: 16 + image_num_layers: 23 + image_head_dim: 64 + image_mlp_dim: 4096 + image_mlp_activations: quick_gelu + image_dropout_rate: 0.0 + image_num_pos: 577 + image_norm_eps: 1.0e-05 + attention_dropout: 0.0 + residual_dropout: 0.0 + initializer_range: 0.02 + fsdp_wrap: false + resize_mode: default + vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt + llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt + low_cpu_fsdp: true + attention_type: sdpa + float32_attention: true + attention_dropout: 0.0 + attention_layer_norm: false + residual_dropout: 0.1 + response_residual_dropout: 0.0 + embedding_dropout: 0.0 + layer_norm_type: rms + layer_norm_with_affine: true + layer_norm_eps: 1.0e-06 + attention_layer_norm_with_affine: true + max_sequence_length: 4096 + max_position_embeddings: null + include_bias: false + bias_for_layer_norm: null + scale_logits: false + vocab_size: 152064 + embedding_size: 152064 + ff_out_size: 0 + additional_vocab_size: 128 + new_embedding_init_range: 0.02 + weight_tying: false + init_device: null + init_fn: normal + init_std: 0.02 + init_cutoff_factor: null + norm_after: false + precision: amp_bf16 + max_crops: 12 + crop_mode: overlap-and-resize-c2 + use_col_tokens: true + prompt_type: uber_model + system_prompt_kind: demo_or_style + message_formatting: role + always_start_with_space: true + multi_annotation_weighting: root_subsegments + default_inference_len: 65 + overlap_margins: + - 4 + - 4 + pad_value: 0.0 + image_padding_embed: pad_and_partial_pad + fix_image_padding: true + vit_layers: + - -2 + - -9 + image_pooling_h: 2 + image_pooling_w: 2 + image_pooling_2d: attention_meanq + image_projector: mlp + image_feature_dropout: 0.0 + initializer_range: 0.02 + normalize_input_embeds: false + use_position_ids: true + head_dim: null + action_tokenizer: + identifier: physical-intelligence/fast + tokenizer_dir: null + action_dim: 7 + horizon: 8 + tokenizer: + identifier: Qwen/Qwen2-7B + tokenizer_dir: null + pad_tokenizer: true + moe_num_experts: 8 + moe_top_k: 2 + moe_mlp_impl: sparse + moe_log_expert_assignment: false + moe_shared_expert: false + moe_lbl_in_fp32: false + moe_interleave: false + moe_loss_weight: 0.1 + moe_zloss_weight: null + moe_dropless: true + moe_capacity_factor: 1.25 + action_head: l1_regression + num_diffusion_steps: 1000 + num_diffusion_inference_steps: 30 + use_proprio: true + action_head_dit_hidden_size: 1152 + action_head_dit_depth: 28 + action_head_dit_num_heads: 16 + llm_causal_attention: false + action_use_left_eef: true + action_use_mobile_base: false +allow_resume: false +ft_llm: true +ft_vit: false +ft_connector: false +ft_embedding: lm_head +lora: false +use_lora: true +lora_rank: 8 +lora_llm: false +lora_vit: false +lora_connector: false +early_exit: false +train_exit_random_layer: false +optimizer: + name: adamw + learning_rate: 0.0001 + weight_decay: 0.01 + betas: + - 0.9 + - 0.95 + eps: 1.0e-05 + connector_learning_rate: 0.0002 + vit_learning_rate: 6.0e-06 + llm_learning_rate: 5.0e-05 + connector_weight_decay: 0.0 + vit_weight_decay: 0.0 + llm_weight_decay: 0.0 + connector_betas: + - 0.9 + - 0.95 + vit_betas: + - 0.9 + - 0.95 + llm_betas: + - 0.9 + - 0.95 + connector_eps: 1.0e-06 + vit_eps: 1.0e-06 + llm_eps: 1.0e-06 + metrics_log_interval: 20 +scheduler: + name: multimodal + units: steps + t_warmup: 100 + t_max: null + alpha_f: 0.1 + connector_t_warmup: 200 + vit_t_warmup: 2000 + llm_t_warmup: 2000 + grad_clip_warmup_steps: null + grad_clip_warmup_factor: null + warmup_min_lr: 0.0 +data: + dataset: vla_dataset_realworld + mixture: null + root_size_mixture: null + split: train + seed: 95818 + shuffle_messages: false + pad: to_max + sequence_length: 1600 + shuffle: true + for_inference: false + multi_modal: torch + num_workers: 0 + drop_last: true + pin_memory: true + prefetch_factor: null + persistent_workers: false + timeout: 0 + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Wipe + use_wrist_image: true + use_proprio: true + rlds_shuffle_buffer_size: 100000 + rlds_traj_threads: 8 + rlds_read_threads: 8 + lerobot_episode_index_start: null + lerobot_episode_index_end: null +restore_dataloader: true +fast_forward_batches: null +evaluators: +- label: val + data: + dataset: vla_dataset_realworld + mixture: null + root_size_mixture: null + split: validation + seed: null + shuffle_messages: false + pad: to_max + sequence_length: 1600 + shuffle: false + for_inference: false + multi_modal: torch + num_workers: 0 + drop_last: true + pin_memory: true + prefetch_factor: null + persistent_workers: true + timeout: 0 + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + use_wrist_image: true + use_proprio: true + rlds_shuffle_buffer_size: 256000 + rlds_traj_threads: 8 + rlds_read_threads: 8 + lerobot_episode_index_start: 353 + lerobot_episode_index_end: 765 + device_eval_batch_size: null + subset_num_batches: 64 + max_examples: null + max_new_tokens: 448 + mm_evaluator: null + save_dir: null + save_to_checkpoint_dir: false + eval_name: null + skip_if_metrics_cached: true +eval_interval: 0 +inf_eval_interval: -1 +inf_evaluators: [] +save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/all_l1 +remote_save_folder: null +canceled_check_interval: 50 +save_interval: 500 +save_interval_unsharded: 500 +save_interval_ephemeral: null +save_interval_action_head: 500 +save_num_checkpoints_to_keep: 1 +save_num_unsharded_checkpoints_to_keep: 1 +save_num_action_head_checkpoints_to_keep: 2 +save_overwrite: true +force_save_unsharded: false +no_pre_train_checkpoint: true +initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +load_model_config: null +checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +load_path: null +load_path_sharded_checkpointer: null +reset_optimizer_state: false +reset_trainer_state: false +save_dataloader_state: false +reset_dataloader_state: false +keep_lr_on_load: true +sharded_checkpointer: torch_legacy +max_duration: 500000 +global_train_batch_size: 126 +device_train_batch_size: 15 +device_train_microbatch_size: 16 +device_eval_batch_size: 4 +eval_subset_num_batches: -1 +eval_on_load: false +device_inf_eval_batch_size: 16 +inf_eval_subset_num_batches: -1 +device_train_grad_accum: 0 +max_grad_norm: 1.0 +multi_component_grad_norm: true +batch_divisor: global_batch +max_grad_norm_ratio: null +precision: amp_bf16 +wandb: + project: a1-realworld + entity: henryeap + group: null + name: realworld_20250930_131219 + tags: + - watching + log_artifacts: false + rank_zero_only: true + log_interval: 1 +speed_monitor: + window_size: 20 + gpu_flops_available: null +console_log_interval: 1 +gen1_gc_interval: 1 +compile: null +fsdp: + use_orig_params: true + sharding_strategy: FULL_SHARD + wrapping_strategy: by_block_and_size + precision: float + hybrid_sharding_num_model_replicas: null +softmax_auxiliary_loss: true +softmax_auxiliary_loss_scale: 0.0001 +time_limit: null +extra_steps_after_cancel: 10 +python_profiling: false +torch_profiling: false +stop_at: 500000 +stop_after: null +activation_checkpointing: whole_layer +fused_loss: null diff --git a/cleandesk50_flow_matching/wandb/wandb/debug-internal.log b/cleandesk50_flow_matching/wandb/wandb/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..8994a86d9e8db1039a6826879c432376be5640d5 --- /dev/null +++ b/cleandesk50_flow_matching/wandb/wandb/debug-internal.log @@ -0,0 +1,12 @@ +{"time":"2025-10-08T16:38:34.806823131Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-08T16:38:35.95264112Z","level":"INFO","msg":"stream: created new stream","id":"quokv8gn"} +{"time":"2025-10-08T16:38:35.952698801Z","level":"INFO","msg":"stream: started","id":"quokv8gn"} +{"time":"2025-10-08T16:38:35.952731371Z","level":"INFO","msg":"sender: started","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:38:35.952734591Z","level":"INFO","msg":"writer: started","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:38:35.952725981Z","level":"INFO","msg":"handler: started","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:43:59.99384105Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"updating run metadata","runtime_seconds":0.001054985}],"total_operations":1}} +{"time":"2025-10-08T16:44:01.036808965Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"} +{"time":"2025-10-08T16:44:01.423613682Z","level":"INFO","msg":"stream: closing","id":"quokv8gn"} +{"time":"2025-10-08T16:44:01.423631393Z","level":"INFO","msg":"handler: closed","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:44:01.425219996Z","level":"INFO","msg":"sender: closed","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:44:01.425239166Z","level":"INFO","msg":"stream: closed","id":"quokv8gn"} diff --git a/cleandesk50_flow_matching/wandb/wandb/debug.log b/cleandesk50_flow_matching/wandb/wandb/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/config.yaml b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..37eb6982204dbca409b27fda138e0c568d8b9a32 --- /dev/null +++ b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/config.yaml @@ -0,0 +1,623 @@ +_wandb: + value: + cli_version: 0.21.4 + e: + yfehyqgufhcu23nx6cclbs2foj5p3ccp: + args: + - qwen2_7b + - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_flow_matching + - --vision_backbone + - openai + - --action_head + - flow_matching + - --seq_len + - "1600" + - --ft_llm + - --checkpoint + - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 + - --device_train_microbatch_size + - "16" + - --global_batch_size + - "126" + - --dataset + - vla_dataset_realworld + - --llm_learning_rate + - "5e-5" + - --wandb_entity + - henryeap + - --wandb_project + - a1-realworld + - --wandb_run_name + - cleandesk50 + - --real_world_vla_config_path + - vla_config_realworld/vla_config_cleandesk50.yaml + - --save_overwrite + codePath: launch_scripts/train_vla.py + codePathLocal: launch_scripts/train_vla.py + cpu_count: 64 + cpu_count_logical: 128 + disk: + /: + total: "470343073792" + used: "50988601344" + email: ihenrykwok@outlook.com + executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10 + git: + commit: 49712a42d21a8c739a16ba5eeaec4a0d7b29ab80 + remote: https://github.com/Spatialtemporal-AI/A1.git + gpu: Instinct MI210 + gpu_amd: + - id: "1" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x75d378aea8d8934d" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "4" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x328cfe1d1a9d2b38" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "6" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x3c4f0005790d7da3" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "0" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x763c831cad37d9b" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "3" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x697c203d8e63f05b" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "7" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x91078b09ae9b0757" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "2" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x2433899c197738b6" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "5" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x2bc0f4cfe424c12a" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + gpu_count: 8 + host: auh7-1b-gpu-319 + memory: + total: "2434606960640" + os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35 + program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py + python: CPython 3.10.18 + root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_flow_matching/wandb + slurm: + cluster_name: ai-04r + conf: /etc/slurm/slurm.conf + cpus_on_node: "128" + gpus_on_node: "8" + gtids: "0" + job_account: faculty-acc + job_cpus_per_node: "128" + job_end_time: "1760200645" + job_gid: "2000" + job_gpus: 0,1,2,3,4,5,6,7 + job_id: "2283" + job_name: mh_cleandesk50_flow_matching + job_nodelist: auh7-1b-gpu-319 + job_num_nodes: "1" + job_partition: faculty + job_qos: xdqos + job_start_time: "1759941445" + job_uid: "2013" + job_user: xiaodan + jobid: "2283" + localid: "0" + nnodes: "1" + nodeid: "0" + nodelist: auh7-1b-gpu-319 + nprocs: "1" + ntasks: "1" + ntasks_per_node: "1" + oom_kill_step: "0" + prio_process: "0" + procid: "0" + submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts + submit_host: auh-1b-cpu-login-001 + task_pid: "152784" + tasks_per_node: "1" + topology_addr: auh7-1b-gpu-319 + topology_addr_pattern: node + startedAt: "2025-10-08T16:38:34.545687Z" + writerId: yfehyqgufhcu23nx6cclbs2foj5p3ccp + m: [] + python_version: 3.10.18 + t: + "1": + - 1 + - 2 + - 3 + - 5 + - 11 + - 41 + - 49 + - 51 + - 53 + - 63 + - 71 + - 83 + - 95 + - 105 + "2": + - 1 + - 2 + - 3 + - 5 + - 11 + - 41 + - 49 + - 51 + - 53 + - 63 + - 71 + - 83 + - 95 + - 105 + "3": + - 2 + - 13 + - 15 + - 16 + - 61 + "4": 3.10.18 + "5": 0.21.4 + "6": 4.56.1 + "10": + - 19 + "12": 0.21.4 + "13": linux-x86_64 +activation_checkpointing: + value: whole_layer +allow_resume: + value: false +batch_divisor: + value: global_batch +canceled_check_interval: + value: 50 +checkpoint_dir: + value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +compile: + value: null +console_log_interval: + value: 1 +data: + value: + dataset: vla_dataset_realworld + drop_last: true + for_inference: false + lerobot_episode_index_end: null + lerobot_episode_index_start: null + mixture: null + multi_modal: torch + num_workers: 0 + pad: to_max + persistent_workers: false + pin_memory: true + prefetch_factor: null + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_read_threads: 8 + rlds_shuffle_buffer_size: 100000 + rlds_traj_threads: 8 + root_size_mixture: null + seed: 95818 + sequence_length: 1600 + shuffle: true + shuffle_messages: false + split: train + timeout: 0 + use_proprio: true + use_wrist_image: true +device_eval_batch_size: + value: 4 +device_inf_eval_batch_size: + value: 16 +device_train_batch_size: + value: 15 +device_train_grad_accum: + value: 0 +device_train_microbatch_size: + value: 16 +dry_run: + value: false +early_exit: + value: false +epoch: + value: null +eval_interval: + value: 0 +eval_on_load: + value: false +eval_subset_num_batches: + value: -1 +evaluators: + value: + - data: + dataset: vla_dataset_realworld + drop_last: true + for_inference: false + lerobot_episode_index_end: 765 + lerobot_episode_index_start: 353 + mixture: null + multi_modal: torch + num_workers: 0 + pad: to_max + persistent_workers: true + pin_memory: true + prefetch_factor: null + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_read_threads: 8 + rlds_shuffle_buffer_size: 256000 + rlds_traj_threads: 8 + root_size_mixture: null + seed: null + sequence_length: 1600 + shuffle: false + shuffle_messages: false + split: validation + timeout: 0 + use_proprio: true + use_wrist_image: true + device_eval_batch_size: null + eval_name: null + label: val + max_examples: null + max_new_tokens: 448 + mm_evaluator: null + save_dir: null + save_to_checkpoint_dir: false + skip_if_metrics_cached: true + subset_num_batches: 64 +extra_steps_after_cancel: + value: 10 +fast_forward_batches: + value: null +force_save_unsharded: + value: false +fsdp: + value: + hybrid_sharding_num_model_replicas: null + precision: float + sharding_strategy: FULL_SHARD + use_orig_params: true + wrapping_strategy: by_block_and_size +ft_connector: + value: false +ft_embedding: + value: lm_head +ft_llm: + value: true +ft_vit: + value: false +fused_loss: + value: null +gen1_gc_interval: + value: 1 +global_train_batch_size: + value: 126 +inf_eval_interval: + value: -1 +inf_eval_subset_num_batches: + value: -1 +inf_evaluators: + value: [] +initial_model_checkpoint: + value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +keep_lr_on_load: + value: true +load_model_config: + value: null +load_path: + value: null +load_path_sharded_checkpointer: + value: null +lora: + value: false +lora_connector: + value: false +lora_llm: + value: false +lora_rank: + value: 8 +lora_vit: + value: false +max_duration: + value: 500000 +max_grad_norm: + value: 1 +max_grad_norm_ratio: + value: null +model: + value: + action_dim: 7 + action_head: flow_matching + action_head_dit_depth: 28 + action_head_dit_hidden_size: 1152 + action_head_dit_num_heads: 16 + action_tokenizer: + identifier: physical-intelligence/fast + tokenizer_dir: null + action_use_left_eef: true + action_use_mobile_base: false + activation_type: swiglu + additional_vocab_size: 128 + always_start_with_space: true + attention_dropout: 0 + attention_layer_norm: false + attention_layer_norm_with_affine: true + attention_type: sdpa + bias_for_layer_norm: null + block_group_size: 1 + block_type: sequential + clip_qkv: null + crop_mode: overlap-and-resize-c2 + d_model: 3584 + default_inference_len: 65 + embedding_dropout: 0 + embedding_size: 152064 + ff_out_size: null + fix_image_padding: true + float32_attention: true + head_dim: null + horizon: 8 + image_feature_dropout: 0 + image_padding_embed: pad_and_partial_pad + image_pooling_2d: attention_meanq + image_pooling_h: 2 + image_pooling_w: 2 + image_projector: mlp + include_bias: false + init_cutoff_factor: null + init_device: null + init_fn: normal + init_std: 0.02 + initializer_range: 0.02 + layer_norm_eps: 1e-06 + layer_norm_type: rms + layer_norm_with_affine: true + llm_causal_attention: false + llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt + low_cpu_fsdp: true + max_crops: 12 + max_position_embeddings: null + max_sequence_length: 4096 + message_formatting: role + mlp_hidden_size: 37888 + mlp_ratio: 4 + moe_capacity_factor: 1.25 + moe_dropless: true + moe_interleave: false + moe_lbl_in_fp32: false + moe_log_expert_assignment: false + moe_loss_weight: 0.1 + moe_mlp_impl: sparse + moe_num_experts: 8 + moe_shared_expert: false + moe_top_k: 2 + moe_zloss_weight: null + multi_annotation_weighting: root_subsegments + n_heads: 28 + n_kv_heads: 4 + n_layers: 28 + new_embedding_init_range: 0.02 + norm_after: false + normalize_input_embeds: false + num_diffusion_inference_steps: 30 + num_diffusion_steps: 1000 + overlap_margins: + - 4 + - 4 + pad_tokenizer: true + pad_value: 0 + precision: amp_bf16 + prompt_type: uber_model + qkv_bias: true + residual_dropout: 0.1 + response_residual_dropout: 0 + rope: true + rope_full_precision: true + rope_theta: 1e+06 + scale_logits: false + system_prompt_kind: demo_or_style + tokenizer: + identifier: Qwen/Qwen2-7B + tokenizer_dir: null + use_col_tokens: true + use_position_ids: true + use_proprio: true + vision_backbone: + attention_dropout: 0 + fsdp_wrap: false + image_default_input_size: + - 336 + - 336 + image_dropout_rate: 0 + image_emb_dim: 1024 + image_head_dim: 64 + image_mlp_activations: quick_gelu + image_mlp_dim: 4096 + image_model_type: openai + image_norm_eps: 1e-05 + image_num_heads: 16 + image_num_key_value_heads: 16 + image_num_layers: 23 + image_num_pos: 577 + image_patch_size: 14 + image_pos_patch_size: 14 + initializer_range: 0.02 + residual_dropout: 0 + resize_mode: default + vit_layers: + - -2 + - -9 + vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt + vocab_size: 152064 + weight_tying: false +multi_component_grad_norm: + value: true +no_pre_train_checkpoint: + value: true +optimizer: + value: + betas: + - 0.9 + - 0.95 + connector_betas: + - 0.9 + - 0.95 + connector_eps: 1e-06 + connector_learning_rate: 0.0002 + connector_weight_decay: 0 + eps: 1e-05 + learning_rate: 0.0001 + llm_betas: + - 0.9 + - 0.95 + llm_eps: 1e-06 + llm_learning_rate: 5e-05 + llm_weight_decay: 0 + metrics_log_interval: 20 + name: adamw + vit_betas: + - 0.9 + - 0.95 + vit_eps: 1e-06 + vit_learning_rate: 6e-06 + vit_weight_decay: 0 + weight_decay: 0.01 +precision: + value: amp_bf16 +python_profiling: + value: false +remote_save_folder: + value: null +reset_dataloader_state: + value: false +reset_optimizer_state: + value: false +reset_trainer_state: + value: false +restore_dataloader: + value: true +run_name: + value: cleandesk50_20251008_163755 +save_dataloader_state: + value: false +save_folder: + value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_flow_matching +save_interval: + value: 500 +save_interval_action_head: + value: 500 +save_interval_ephemeral: + value: null +save_interval_unsharded: + value: 500 +save_num_action_head_checkpoints_to_keep: + value: 2 +save_num_checkpoints_to_keep: + value: 1 +save_num_unsharded_checkpoints_to_keep: + value: 1 +save_overwrite: + value: true +scheduler: + value: + alpha_f: 0.1 + connector_t_warmup: 200 + grad_clip_warmup_factor: null + grad_clip_warmup_steps: null + llm_t_warmup: 2000 + name: multimodal + t_max: null + t_warmup: 100 + units: steps + vit_t_warmup: 2000 + warmup_min_lr: 0 +seed: + value: 6198 +sharded_checkpointer: + value: torch_legacy +softmax_auxiliary_loss: + value: true +softmax_auxiliary_loss_scale: + value: 0.0001 +speed_monitor: + value: + gpu_flops_available: null + window_size: 20 +stop_after: + value: null +stop_at: + value: 500000 +time_limit: + value: null +torch_profiling: + value: false +train_exit_random_layer: + value: false +use_lora: + value: false diff --git a/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/output.log b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/output.log new file mode 100644 index 0000000000000000000000000000000000000000..8ed91a15ae1a1ae1e3e6966039b1c1fa737e8183 --- /dev/null +++ b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/output.log @@ -0,0 +1,180 @@ +wandb: Detected [openai] in use. +wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script. +wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/ +10/08 [16:38:36] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk50', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}} +****** Skip RLDS main; path not found: None +****** start build LeRobot main... +build_tokenizer, cache_dir None tokenizer_dir None +10/08 [16:38:38] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130 + INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:436 +****** before LeRobot dataset... +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk50 +****** length of the dataset: 27906 +10/08 [16:38:42] INFO | >> build_rlds_train_dataset: Loading train dataset: vla_dataset_realworld/train __init__.py:519 +****** Import RLDSBatchTransform, RLDSDataset successfully. +****** before RLDS dataset... +****** data_config.rlds_dataset_name: a1_real_world +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE +214************** +10/08 [16:38:43] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 87212/87212 [00:42<00:00, 2075.20it/s] +214************** +10/08 [16:39:29] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/jaco_play/0.1.0/dataset_statistics_e081d4716a3da95df91c79d661ae59fa26a43da49db4bf8d716b622b56 + 3b0ea3.json. +214************** +10/08 [16:39:30] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_cable_routing/0.1.0/dataset_statistics_08cb4c5b7c5e6c035fc84ea85b2d54c0c46ad608a8763 + 4ebb18374088d23cd76.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/viola/0.1.0/dataset_statistics_2415d8f7de73c8761fedd7c2a9590667fb0d3fdd26664bf4c100222e5cdb89 + b9.json. +214************** + INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 1000/1000 [00:04<00:00, 203.13it/s] +214************** +10/08 [16:39:37] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_buds_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_ccecde24cc01793b221 + 4eb0c4c5d7cc0e3ccc623db99bd892b83552b20decfb7.json. +214************** +10/08 [16:39:38] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 456/456 [00:23<00:00, 19.46it/s] +214************** +10/08 [16:40:03] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 5100/5100 [00:57<00:00, 88.60it/s] +214************** +10/08 [16:41:05] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 240/240 [00:08<00:00, 28.55it/s] +214************** +10/08 [16:41:15] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 559/559 [00:01<00:00, 377.56it/s] +214************** +10/08 [16:41:17] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/dlr_edan_shared_control_converted_externally_to_rlds/0.1.0/dataset_statistics_b8984563fc3e7ea + c0803c667ef58c9deaf2e747683568306ea1d83505d532a76.json. +214************** + INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 1500/1500 [00:05<00:00, 254.65it/s] +214************** +10/08 [16:41:24] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_fanuc_manipulation/0.1.0/dataset_statistics_a98d349d0364668095ea3ca38c6785e94f35e5e5 + 8e234c88fac83775a923b0d0.json. +214************** +10/08 [16:41:25] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 43264/43264 [00:26<00:00, 1623.73it/s] +214************** +10/08 [16:41:58] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 1995/1995 [00:01<00:00, 1859.15it/s] +214************** +10/08 [16:42:00] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 1003/1003 [00:02<00:00, 406.96it/s] +214************** +10/08 [16:42:03] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 150/150 [00:00<00:00, 1760.96it/s] +214************** +10/08 [16:42:04] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 631/631 [00:01<00:00, 396.82it/s] + +###################################################################################### +# Loading the following 18 datasets (incl. sampling weight): # +# fractal20220817_data: ====================================================0.529250 # +# jaco_play: ===============================================================0.010898 # +# berkeley_cable_routing: ==================================================0.005916 # +# viola: ===================================================================0.021337 # +# berkeley_autolab_ur5: ====================================================0.027379 # +# austin_buds_dataset_converted_externally_to_rlds: ========================0.004768 # +# nyu_franka_play_dataset_converted_externally_to_rlds: ====================0.018817 # +# furniture_bench_dataset_converted_externally_to_rlds: ====================0.055185 # +# austin_sailor_dataset_converted_externally_to_rlds: ======================0.049354 # +# austin_sirius_dataset_converted_externally_to_rlds: ======================0.039129 # +# dlr_edan_shared_control_converted_externally_to_rlds: ====================0.001248 # +# utaustin_mutex: ==========================================================0.050583 # +# berkeley_fanuc_manipulation: =============================================0.017504 # +# bc_z: ====================================================================0.168166 # +# roboturk: ================================================================0.000131 # +# toto: ====================================================================0.000228 # +# ucsd_kitchen_dataset_converted_externally_to_rlds: =======================0.000006 # +# iamlab_cmu_pickup_insert_converted_externally_to_rlds: ===================0.000102 # +###################################################################################### + +10/08 [16:42:06] INFO | >> [*] Threads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:563 + INFO | >> [*] Reads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:564 + INFO | >> [*] Constructing datasets... dataset.py:567 +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +10/08 [16:42:11] INFO | >> [*] Applying frame transforms on dataset... dataset.py:607 +****** after RLDSDataset initialization! +****** length of the dataset: 7154275 +****** Build rlds train dataset: IterableDatasetWrapper successfully. +****** path: None +****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None +****** After build vla train dataset... +****** iterable_sources: [, ] +****** Before build mixed iterable dataset... +****** Build vla train dataloader successfully! +************************* Build train_dataloader successful! +************************* Before build_inf_evaluators + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +************************* Build evaluators successful! +************************* Early exit flags: early_exit=False +PROPRIO_DIM 16 does not match ACTION_DIM 16 for AffordVLA +************************* Initialize model successful! +***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt +***** Load checkpoint successful! +missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_ +unexpected keys: [] +************************* Initialize model successful! +************************* Before FSDP model wrapping +************************* FSDP model wrapping successful! +************************* Before building optimizer and scheduler +10/08 [16:43:47] INFO | >> Constructing optimizer with 2 param groups optim.py:1283 +************************************************** +After building optimizer and scheduler and model, before training, peak GPU memory (MB): 36856 +************************* VLATrainer initialized successfully! +************************* Before trainer.fit() +Pre-train system metrics + System/Peak GPU Memory (MB)=36,856 +10/08 [16:43:57] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109 + sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor). + timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch] + +!!!Training failed: stack expects each tensor to be equal size, but got [] at entry 0 and [1] at entry 1 +Traceback (most recent call last): + File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 593, in main + trainer.fit() + File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2284, in fit + for batch in self.train_loader: + File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 734, in __next__ + data = self._next_data() + File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 790, in _next_data + data = self._dataset_fetcher.fetch(index) # may raise StopIteration + File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py", line 43, in fetch + return self.collate_fn(data) + File "/vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py", line 201, in __call__ + out['timestep'] = torch.stack(timestep_list, dim=0) +RuntimeError: stack expects each tensor to be equal size, but got [] at entry 0 and [1] at entry 1 +wandb: WARNING The `quiet` argument to `wandb.run.finish()` is deprecated, use `wandb.Settings(quiet=...)` to set this instead. diff --git a/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/requirements.txt b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/requirements.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8 --- /dev/null +++ b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/requirements.txt @@ -0,0 +1,286 @@ +ai2-molmo==0.0.0 +astunparse==1.6.3 +flatbuffers==25.2.10 +gast==0.6.0 +google-pasta==0.2.0 +h5py==3.14.0 +libclang==18.1.1 +Markdown==3.9 +namex==0.1.0 +opt_einsum==3.4.0 +optree==0.17.0 +tensorboard-data-server==0.7.2 +tensorflow-io-gcs-filesystem==0.37.1 +termcolor==3.1.0 +Werkzeug==3.1.3 +Brotli==1.1.0 +Farama-Notifications==0.0.4 +MarkupSafe==2.1.5 +PyYAML==6.0.2 +absl-py==2.3.1 +accelerate==1.10.1 +ai2-molmo==0.0.0 +aiofiles==24.1.0 +aiohappyeyeballs==2.6.1 +aiohttp==3.12.15 +aiosignal==1.4.0 +annotated-types==0.7.0 +antlr4-python3-runtime==4.9.3 +anyio==4.10.0 +array_record==0.8.1 +async-timeout==5.0.1 +attrs==25.3.0 +av==15.1.0 +backports.tarfile==1.2.0 +beaker-gantry==3.2.0 +beaker-py==2.5.0 +black==23.12.1 +blinker==1.9.0 +boltons==25.0.0 +boto3==1.40.33 +botocore==1.40.33 +build==1.3.0 +cached_path==1.7.3 +cached-property==2.0.1 +cachetools==5.5.2 +certifi==2025.8.3 +cffi==2.0.0 +charset-normalizer==3.4.3 +click==8.2.1 +click-help-colors==0.9.4 +click-option-group==0.5.7 +cloudpickle==3.1.1 +cmake==4.1.0 +contourpy==1.3.2 +cryptography==46.0.1 +cycler==0.12.1 +dataclass-extensions==0.2.3 +datasets==3.6.0 +decorator==5.2.1 +deepdiff==8.6.1 +diffusers==0.35.1 +dill==0.3.8 +distro==1.9.0 +dlimp==0.0.1 +dm-tree==0.1.9 +docutils==0.22.1 +draccus==0.10.0 +editdistance==0.8.1 +einops==0.8.1 +einops-exts==0.0.4 +et_xmlfile==2.0.0 +etils==1.13.0 +evdev==1.9.2 +exceptiongroup==1.3.0 +face==24.0.0 +fastapi==0.116.2 +ffmpy==0.6.1 +fiddle==0.3.0 +filelock==3.13.1 +Flask==3.1.2 +fonttools==4.60.0 +frozenlist==1.7.0 +fsspec==2023.9.2 +ftfy==6.3.1 +gcsfs==2023.9.2 +gitdb==4.0.12 +GitPython==3.1.45 +glom==24.11.0 +google-api-core==2.25.1 +google-auth==2.40.3 +google-auth-oauthlib==1.2.2 +google-cloud-core==2.4.3 +google-cloud-storage==2.19.0 +google-crc32c==1.7.1 +google-resumable-media==2.7.2 +googleapis-common-protos==1.70.0 +gradio==5.46.0 +gradio_client==1.13.0 +graphviz==0.21 +groovy==0.1.2 +grpcio==1.75.0 +gymnasium==0.29.1 +h11==0.16.0 +hf_transfer==0.1.9 +hf-xet==1.1.10 +httpcore==1.0.9 +httpx==0.28.1 +huggingface-hub==0.35.0 +id==1.5.0 +idna==3.10 +imageio==2.37.0 +imageio-ffmpeg==0.6.0 +importlib_metadata==8.7.0 +importlib_resources==6.5.2 +iniconfig==2.1.0 +inquirerpy==0.3.4 +isort==5.12.0 +itsdangerous==2.2.0 +jaraco.classes==3.4.0 +jaraco.context==6.0.1 +jaraco.functools==4.3.0 +jeepney==0.9.0 +Jinja2==3.1.4 +jiter==0.11.0 +jmespath==1.0.1 +joblib==1.5.2 +jsonlines==4.0.0 +keras==2.15.0 +keyring==25.6.0 +kiwisolver==1.4.9 +latex2sympy2_extended==1.10.2 +lerobot==0.3.4 +Levenshtein==0.27.1 +libcst==1.8.4 +lightning-utilities==0.15.2 +markdown-it-py==4.0.0 +math-verify==0.8.0 +matplotlib==3.10.6 +mdurl==0.1.2 +mergedeep==1.3.4 +ml-dtypes==0.2.0 +ml_dtypes==0.5.3 +more-itertools==10.8.0 +mpmath==1.3.0 +msgspec==0.19.0 +multidict==6.6.4 +multiprocess==0.70.16 +mypy==1.3.0 +mypy_extensions==1.1.0 +necessary==0.4.3 +networkx==3.3 +nh3==0.3.0 +nltk==3.9.1 +numpy==1.26.4 +oauthlib==3.3.1 +omegaconf==2.3.0 +openai==1.108.0 +opencv-python-headless==4.12.0.88 +OpenEXR==3.4.0 +openpyxl==3.1.5 +orderly-set==5.5.0 +orjson==3.11.3 +packaging==25.0 +pandas==2.3.2 +pathspec==0.12.1 +petname==2.6 +pfzy==0.3.4 +pillow==11.0.0 +pip==25.2 +platformdirs==4.4.0 +pluggy==1.6.0 +promise==2.3 +prompt_toolkit==3.0.52 +propcache==0.3.2 +proto-plus==1.26.1 +protobuf==4.21.12 +protobuf==6.32.1 +psutil==7.1.0 +pyarrow==21.0.0 +pyasn1==0.6.1 +pyasn1_modules==0.4.2 +pycparser==2.23 +pydantic==2.11.9 +pydantic_core==2.33.2 +pydub==0.25.1 +Pygments==2.19.2 +pynput==1.8.1 +pyparsing==3.2.4 +pyproject_hooks==1.2.0 +pyserial==3.5 +pytest==8.4.2 +pytest-sphinx==0.6.3 +python-dateutil==2.9.0.post0 +python-Levenshtein==0.27.1 +python-multipart==0.0.20 +python-xlib==0.33 +pytorch-triton-rocm==3.4.0 +pytz==2025.2 +pyyaml-include==1.4.1 +RapidFuzz==3.14.1 +readme_renderer==44.0 +regex==2025.9.1 +requests==2.32.5 +requests-oauthlib==2.0.0 +requests-toolbelt==1.0.0 +requirements-parser==0.13.0 +rerun-sdk==0.22.1 +rfc3986==2.0.0 +rich==13.9.4 +rsa==4.9.1 +ruff==0.13.0 +s3transfer==0.14.0 +safehttpx==0.1.6 +safetensors==0.6.2 +scikit-learn==1.7.2 +scipy==1.15.3 +SecretStorage==3.4.0 +semantic-version==2.10.0 +sentencepiece==0.2.1 +sentry-sdk==2.38.0 +setuptools==78.1.1 +shellingham==1.5.4 +six==1.17.0 +smart_open==7.3.1 +smashed==0.21.5 +smmap==5.0.2 +sniffio==1.3.1 +starlette==0.48.0 +sympy==1.13.3 +tensorboard==2.15.2 +tensorboard==2.19.0 +tensorflow==2.15.0 +tensorflow-addons==0.23.0 +tensorflow-datasets==4.9.3 +tensorflow-estimator==2.15.0 +tensorflow-graphics==2021.12.3 +tensorflow-metadata==1.17.2 +threadpoolctl==3.6.0 +timm==1.0.19 +tokenizers==0.22.0 +toml==0.10.2 +tomli==2.2.1 +tomlkit==0.13.3 +torch==2.8.0+rocm6.4 +torchcodec==0.5 +torchmetrics==1.8.2 +torchvision==0.23.0+rocm6.4 +tqdm==4.67.1 +transformers==4.56.1 +trimesh==4.8.2 +trouting==0.3.3 +twine==6.2.0 +typeguard==2.13.3 +typer==0.17.4 +typing_extensions==4.15.0 +typing-inspect==0.9.0 +typing-inspection==0.4.1 +tzdata==2025.2 +urllib3==2.5.0 +uvicorn==0.35.0 +wandb==0.21.4 +wcwidth==0.2.13 +websockets==15.0.1 +wheel==0.45.1 +wrapt==1.14.2 +xxhash==3.5.0 +yarl==1.20.1 +zipp==3.23.0 +lerobot==0.3.4 +minLoRA==0.1.0 +autocommand==2.2.2 +backports.tarfile==1.2.0 +importlib_metadata==8.0.0 +inflect==7.3.1 +jaraco.collections==5.1.0 +jaraco.context==5.3.0 +jaraco.functools==4.0.1 +jaraco.text==3.12.1 +more-itertools==10.3.0 +packaging==24.2 +platformdirs==4.2.2 +tomli==2.0.1 +typeguard==4.3.0 +typing_extensions==4.12.2 +wheel==0.45.1 +zipp==3.19.2 diff --git a/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/wandb-metadata.json b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/wandb-metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..49b2bb13bfeb9e08c7be000e79c1ccbbee1753c7 --- /dev/null +++ b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/wandb-metadata.json @@ -0,0 +1,204 @@ +{ + "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35", + "python": "CPython 3.10.18", + "startedAt": "2025-10-08T16:38:34.545687Z", + "args": [ + "qwen2_7b", + "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_flow_matching", + "--vision_backbone", + "openai", + "--action_head", + "flow_matching", + "--seq_len", + "1600", + "--ft_llm", + "--checkpoint", + "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924", + "--device_train_microbatch_size", + "16", + "--global_batch_size", + "126", + "--dataset", + "vla_dataset_realworld", + "--llm_learning_rate", + "5e-5", + "--wandb_entity", + "henryeap", + "--wandb_project", + "a1-realworld", + "--wandb_run_name", + "cleandesk50", + "--real_world_vla_config_path", + "vla_config_realworld/vla_config_cleandesk50.yaml", + "--save_overwrite" + ], + "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py", + "codePath": "launch_scripts/train_vla.py", + "codePathLocal": "launch_scripts/train_vla.py", + "git": { + "remote": "https://github.com/Spatialtemporal-AI/A1.git", + "commit": "49712a42d21a8c739a16ba5eeaec4a0d7b29ab80" + }, + "email": "ihenrykwok@outlook.com", + "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_flow_matching/wandb", + "host": "auh7-1b-gpu-319", + "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10", + "cpu_count": 64, + "cpu_count_logical": 128, + "gpu": "Instinct MI210", + "gpu_count": 8, + "disk": { + "/": { + "total": "470343073792", + "used": "50988601344" + } + }, + "memory": { + "total": "2434606960640" + }, + "gpu_amd": [ + { + "id": "1", + "uniqueId": "0x75d378aea8d8934d", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "4", + "uniqueId": "0x328cfe1d1a9d2b38", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "6", + "uniqueId": "0x3c4f0005790d7da3", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "0", + "uniqueId": "0x763c831cad37d9b", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "3", + "uniqueId": "0x697c203d8e63f05b", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "7", + "uniqueId": "0x91078b09ae9b0757", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "2", + "uniqueId": "0x2433899c197738b6", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "5", + "uniqueId": "0x2bc0f4cfe424c12a", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + } + ], + "slurm": { + "cluster_name": "ai-04r", + "conf": "/etc/slurm/slurm.conf", + "cpus_on_node": "128", + "gpus_on_node": "8", + "gtids": "0", + "job_account": "faculty-acc", + "job_cpus_per_node": "128", + "job_end_time": "1760200645", + "job_gid": "2000", + "job_gpus": "0,1,2,3,4,5,6,7", + "job_id": "2283", + "job_name": "mh_cleandesk50_flow_matching", + "job_nodelist": "auh7-1b-gpu-319", + "job_num_nodes": "1", + "job_partition": "faculty", + "job_qos": "xdqos", + "job_start_time": "1759941445", + "job_uid": "2013", + "job_user": "xiaodan", + "jobid": "2283", + "localid": "0", + "nnodes": "1", + "nodeid": "0", + "nodelist": "auh7-1b-gpu-319", + "nprocs": "1", + "ntasks": "1", + "ntasks_per_node": "1", + "oom_kill_step": "0", + "prio_process": "0", + "procid": "0", + "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts", + "submit_host": "auh-1b-cpu-login-001", + "task_pid": "152784", + "tasks_per_node": "1", + "topology_addr": "auh7-1b-gpu-319", + "topology_addr_pattern": "node" + }, + "writerId": "yfehyqgufhcu23nx6cclbs2foj5p3ccp" +} \ No newline at end of file diff --git a/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/wandb-summary.json b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/wandb-summary.json new file mode 100644 index 0000000000000000000000000000000000000000..1a8df177e389cba9a1dc5de730e047da1f1617ad --- /dev/null +++ b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/files/wandb-summary.json @@ -0,0 +1 @@ +{"_timestamp":1.7599418275553412e+09,"_wandb":{"runtime":323},"_runtime":323.700364245,"_step":0,"System/Peak GPU Memory (MB)":36856.41796875} \ No newline at end of file diff --git a/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/logs/debug-core.log b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/logs/debug-core.log new file mode 100644 index 0000000000000000000000000000000000000000..f995cde09b9f448bdf0318f021c4efa8bdc4d87f --- /dev/null +++ b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/logs/debug-core.log @@ -0,0 +1,16 @@ +{"time":"2025-10-08T16:38:34.695045626Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmp3fc8cjxs/port-152974.txt","pid":152974,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false} +{"time":"2025-10-08T16:38:34.696250464Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":152974} +{"time":"2025-10-08T16:38:34.696200463Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-152974-153157-1697716542/socket","Net":"unix"}} +{"time":"2025-10-08T16:38:34.795279742Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"} +{"time":"2025-10-08T16:38:34.805004585Z","level":"INFO","msg":"handleInformInit: received","streamId":"quokv8gn","id":"1(@)"} +{"time":"2025-10-08T16:38:35.952704891Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"quokv8gn","id":"1(@)"} +{"time":"2025-10-08T16:44:01.423240817Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"quokv8gn","id":"1(@)"} +{"time":"2025-10-08T16:44:01.426683567Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"quokv8gn","id":"1(@)"} +{"time":"2025-10-08T16:44:01.48018829Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"} +{"time":"2025-10-08T16:44:01.48022619Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"} +{"time":"2025-10-08T16:44:01.48023591Z","level":"INFO","msg":"connection: closing","id":"1(@)"} +{"time":"2025-10-08T16:44:01.480247021Z","level":"INFO","msg":"server is shutting down"} +{"time":"2025-10-08T16:44:01.480274301Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"} +{"time":"2025-10-08T16:44:01.480277991Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"} +{"time":"2025-10-08T16:44:01.480326482Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-152974-153157-1697716542/socket","Net":"unix"}} +{"time":"2025-10-08T16:44:01.480358322Z","level":"INFO","msg":"server is closed"} diff --git a/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/logs/debug-internal.log b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/logs/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..8994a86d9e8db1039a6826879c432376be5640d5 --- /dev/null +++ b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/logs/debug-internal.log @@ -0,0 +1,12 @@ +{"time":"2025-10-08T16:38:34.806823131Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-08T16:38:35.95264112Z","level":"INFO","msg":"stream: created new stream","id":"quokv8gn"} +{"time":"2025-10-08T16:38:35.952698801Z","level":"INFO","msg":"stream: started","id":"quokv8gn"} +{"time":"2025-10-08T16:38:35.952731371Z","level":"INFO","msg":"sender: started","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:38:35.952734591Z","level":"INFO","msg":"writer: started","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:38:35.952725981Z","level":"INFO","msg":"handler: started","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:43:59.99384105Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"updating run metadata","runtime_seconds":0.001054985}],"total_operations":1}} +{"time":"2025-10-08T16:44:01.036808965Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"} +{"time":"2025-10-08T16:44:01.423613682Z","level":"INFO","msg":"stream: closing","id":"quokv8gn"} +{"time":"2025-10-08T16:44:01.423631393Z","level":"INFO","msg":"handler: closed","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:44:01.425219996Z","level":"INFO","msg":"sender: closed","stream_id":"quokv8gn"} +{"time":"2025-10-08T16:44:01.425239166Z","level":"INFO","msg":"stream: closed","id":"quokv8gn"} diff --git a/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/logs/debug.log b/cleandesk50_flow_matching/wandb/wandb/run-20251008_163834-quokv8gn/logs/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/cleandesk50_l1_regression/wandb/wandb/debug-internal.log b/cleandesk50_l1_regression/wandb/wandb/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..66a0fb2bb4c67d7f04a61c0c9f52c0db563747b5 --- /dev/null +++ b/cleandesk50_l1_regression/wandb/wandb/debug-internal.log @@ -0,0 +1,12 @@ +{"time":"2025-10-08T16:38:31.726288089Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-08T16:38:33.081399086Z","level":"INFO","msg":"stream: created new stream","id":"fqdwkc8m"} +{"time":"2025-10-08T16:38:33.081437966Z","level":"INFO","msg":"stream: started","id":"fqdwkc8m"} +{"time":"2025-10-08T16:38:33.081464946Z","level":"INFO","msg":"sender: started","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:38:33.081464936Z","level":"INFO","msg":"writer: started","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:38:33.081488306Z","level":"INFO","msg":"handler: started","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:44:35.233389442Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"updating run metadata","runtime_seconds":0.00059375}],"total_operations":1}} +{"time":"2025-10-08T16:44:37.058187164Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"} +{"time":"2025-10-08T16:44:37.412033949Z","level":"INFO","msg":"stream: closing","id":"fqdwkc8m"} +{"time":"2025-10-08T16:44:37.412048989Z","level":"INFO","msg":"handler: closed","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:44:37.4130748Z","level":"INFO","msg":"sender: closed","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:44:37.41308173Z","level":"INFO","msg":"stream: closed","id":"fqdwkc8m"} diff --git a/cleandesk50_l1_regression/wandb/wandb/debug.log b/cleandesk50_l1_regression/wandb/wandb/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/config.yaml b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..c9f62b30203b6072d424e762a252e57c3c479c8b --- /dev/null +++ b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/config.yaml @@ -0,0 +1,623 @@ +_wandb: + value: + cli_version: 0.21.4 + e: + da16lrefa3ue6fcq4audbkzfio2vskvf: + args: + - qwen2_7b + - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_l1_regression + - --vision_backbone + - openai + - --action_head + - l1_regression + - --seq_len + - "1600" + - --ft_llm + - --checkpoint + - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 + - --device_train_microbatch_size + - "16" + - --global_batch_size + - "126" + - --dataset + - vla_dataset_realworld + - --llm_learning_rate + - "5e-5" + - --wandb_entity + - henryeap + - --wandb_project + - a1-realworld + - --wandb_run_name + - cleandesk50 + - --real_world_vla_config_path + - vla_config_realworld/vla_config_cleandesk50.yaml + - --save_overwrite + codePath: launch_scripts/train_vla.py + codePathLocal: launch_scripts/train_vla.py + cpu_count: 64 + cpu_count_logical: 128 + disk: + /: + total: "470343073792" + used: "52340371456" + email: ihenrykwok@outlook.com + executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10 + git: + commit: 49712a42d21a8c739a16ba5eeaec4a0d7b29ab80 + remote: https://github.com/Spatialtemporal-AI/A1.git + gpu: Instinct MI210 + gpu_amd: + - id: "7" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x21a2e88d06c419dc" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "4" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0xa515afd8ced1d39d" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "2" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x399226d2b2bfa544" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "6" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0xfa8b85a4625b04f" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "3" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0xf61ec17df11883bd" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "1" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x9b5c1c302c8129f8" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "0" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x3558c3014c813fdb" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "5" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x137c9ede1bb1518e" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + gpu_count: 8 + host: auh7-1b-gpu-188 + memory: + total: "2434606964736" + os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35 + program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py + python: CPython 3.10.18 + root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_l1_regression/wandb + slurm: + cluster_name: ai-04r + conf: /etc/slurm/slurm.conf + cpus_on_node: "128" + gpus_on_node: "8" + gtids: "0" + job_account: faculty-acc + job_cpus_per_node: "128" + job_end_time: "1760200645" + job_gid: "2000" + job_gpus: 0,1,2,3,4,5,6,7 + job_id: "2284" + job_name: mh_cleandesk50_l1_regression + job_nodelist: auh7-1b-gpu-188 + job_num_nodes: "1" + job_partition: faculty + job_qos: xdqos + job_start_time: "1759941445" + job_uid: "2013" + job_user: xiaodan + jobid: "2284" + localid: "0" + nnodes: "1" + nodeid: "0" + nodelist: auh7-1b-gpu-188 + nprocs: "1" + ntasks: "1" + ntasks_per_node: "1" + oom_kill_step: "0" + prio_process: "0" + procid: "0" + submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts + submit_host: auh-1b-cpu-login-001 + task_pid: "2621518" + tasks_per_node: "1" + topology_addr: auh7-1b-gpu-188 + topology_addr_pattern: node + startedAt: "2025-10-08T16:38:31.458924Z" + writerId: da16lrefa3ue6fcq4audbkzfio2vskvf + m: [] + python_version: 3.10.18 + t: + "1": + - 1 + - 2 + - 3 + - 5 + - 11 + - 41 + - 49 + - 51 + - 53 + - 63 + - 71 + - 83 + - 95 + - 105 + "2": + - 1 + - 2 + - 3 + - 5 + - 11 + - 41 + - 49 + - 51 + - 53 + - 63 + - 71 + - 83 + - 95 + - 105 + "3": + - 2 + - 13 + - 15 + - 16 + - 61 + "4": 3.10.18 + "5": 0.21.4 + "6": 4.56.1 + "10": + - 19 + "12": 0.21.4 + "13": linux-x86_64 +activation_checkpointing: + value: whole_layer +allow_resume: + value: false +batch_divisor: + value: global_batch +canceled_check_interval: + value: 50 +checkpoint_dir: + value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +compile: + value: null +console_log_interval: + value: 1 +data: + value: + dataset: vla_dataset_realworld + drop_last: true + for_inference: false + lerobot_episode_index_end: null + lerobot_episode_index_start: null + mixture: null + multi_modal: torch + num_workers: 0 + pad: to_max + persistent_workers: false + pin_memory: true + prefetch_factor: null + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_read_threads: 8 + rlds_shuffle_buffer_size: 100000 + rlds_traj_threads: 8 + root_size_mixture: null + seed: 95818 + sequence_length: 1600 + shuffle: true + shuffle_messages: false + split: train + timeout: 0 + use_proprio: true + use_wrist_image: true +device_eval_batch_size: + value: 4 +device_inf_eval_batch_size: + value: 16 +device_train_batch_size: + value: 15 +device_train_grad_accum: + value: 0 +device_train_microbatch_size: + value: 16 +dry_run: + value: false +early_exit: + value: false +epoch: + value: null +eval_interval: + value: 0 +eval_on_load: + value: false +eval_subset_num_batches: + value: -1 +evaluators: + value: + - data: + dataset: vla_dataset_realworld + drop_last: true + for_inference: false + lerobot_episode_index_end: 765 + lerobot_episode_index_start: 353 + mixture: null + multi_modal: torch + num_workers: 0 + pad: to_max + persistent_workers: true + pin_memory: true + prefetch_factor: null + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_read_threads: 8 + rlds_shuffle_buffer_size: 256000 + rlds_traj_threads: 8 + root_size_mixture: null + seed: null + sequence_length: 1600 + shuffle: false + shuffle_messages: false + split: validation + timeout: 0 + use_proprio: true + use_wrist_image: true + device_eval_batch_size: null + eval_name: null + label: val + max_examples: null + max_new_tokens: 448 + mm_evaluator: null + save_dir: null + save_to_checkpoint_dir: false + skip_if_metrics_cached: true + subset_num_batches: 64 +extra_steps_after_cancel: + value: 10 +fast_forward_batches: + value: null +force_save_unsharded: + value: false +fsdp: + value: + hybrid_sharding_num_model_replicas: null + precision: float + sharding_strategy: FULL_SHARD + use_orig_params: true + wrapping_strategy: by_block_and_size +ft_connector: + value: false +ft_embedding: + value: lm_head +ft_llm: + value: true +ft_vit: + value: false +fused_loss: + value: null +gen1_gc_interval: + value: 1 +global_train_batch_size: + value: 126 +inf_eval_interval: + value: -1 +inf_eval_subset_num_batches: + value: -1 +inf_evaluators: + value: [] +initial_model_checkpoint: + value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +keep_lr_on_load: + value: true +load_model_config: + value: null +load_path: + value: null +load_path_sharded_checkpointer: + value: null +lora: + value: false +lora_connector: + value: false +lora_llm: + value: false +lora_rank: + value: 8 +lora_vit: + value: false +max_duration: + value: 500000 +max_grad_norm: + value: 1 +max_grad_norm_ratio: + value: null +model: + value: + action_dim: 7 + action_head: l1_regression + action_head_dit_depth: 28 + action_head_dit_hidden_size: 1152 + action_head_dit_num_heads: 16 + action_tokenizer: + identifier: physical-intelligence/fast + tokenizer_dir: null + action_use_left_eef: true + action_use_mobile_base: false + activation_type: swiglu + additional_vocab_size: 128 + always_start_with_space: true + attention_dropout: 0 + attention_layer_norm: false + attention_layer_norm_with_affine: true + attention_type: sdpa + bias_for_layer_norm: null + block_group_size: 1 + block_type: sequential + clip_qkv: null + crop_mode: overlap-and-resize-c2 + d_model: 3584 + default_inference_len: 65 + embedding_dropout: 0 + embedding_size: 152064 + ff_out_size: null + fix_image_padding: true + float32_attention: true + head_dim: null + horizon: 8 + image_feature_dropout: 0 + image_padding_embed: pad_and_partial_pad + image_pooling_2d: attention_meanq + image_pooling_h: 2 + image_pooling_w: 2 + image_projector: mlp + include_bias: false + init_cutoff_factor: null + init_device: null + init_fn: normal + init_std: 0.02 + initializer_range: 0.02 + layer_norm_eps: 1e-06 + layer_norm_type: rms + layer_norm_with_affine: true + llm_causal_attention: false + llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt + low_cpu_fsdp: true + max_crops: 12 + max_position_embeddings: null + max_sequence_length: 4096 + message_formatting: role + mlp_hidden_size: 37888 + mlp_ratio: 4 + moe_capacity_factor: 1.25 + moe_dropless: true + moe_interleave: false + moe_lbl_in_fp32: false + moe_log_expert_assignment: false + moe_loss_weight: 0.1 + moe_mlp_impl: sparse + moe_num_experts: 8 + moe_shared_expert: false + moe_top_k: 2 + moe_zloss_weight: null + multi_annotation_weighting: root_subsegments + n_heads: 28 + n_kv_heads: 4 + n_layers: 28 + new_embedding_init_range: 0.02 + norm_after: false + normalize_input_embeds: false + num_diffusion_inference_steps: 30 + num_diffusion_steps: 1000 + overlap_margins: + - 4 + - 4 + pad_tokenizer: true + pad_value: 0 + precision: amp_bf16 + prompt_type: uber_model + qkv_bias: true + residual_dropout: 0.1 + response_residual_dropout: 0 + rope: true + rope_full_precision: true + rope_theta: 1e+06 + scale_logits: false + system_prompt_kind: demo_or_style + tokenizer: + identifier: Qwen/Qwen2-7B + tokenizer_dir: null + use_col_tokens: true + use_position_ids: true + use_proprio: true + vision_backbone: + attention_dropout: 0 + fsdp_wrap: false + image_default_input_size: + - 336 + - 336 + image_dropout_rate: 0 + image_emb_dim: 1024 + image_head_dim: 64 + image_mlp_activations: quick_gelu + image_mlp_dim: 4096 + image_model_type: openai + image_norm_eps: 1e-05 + image_num_heads: 16 + image_num_key_value_heads: 16 + image_num_layers: 23 + image_num_pos: 577 + image_patch_size: 14 + image_pos_patch_size: 14 + initializer_range: 0.02 + residual_dropout: 0 + resize_mode: default + vit_layers: + - -2 + - -9 + vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt + vocab_size: 152064 + weight_tying: false +multi_component_grad_norm: + value: true +no_pre_train_checkpoint: + value: true +optimizer: + value: + betas: + - 0.9 + - 0.95 + connector_betas: + - 0.9 + - 0.95 + connector_eps: 1e-06 + connector_learning_rate: 0.0002 + connector_weight_decay: 0 + eps: 1e-05 + learning_rate: 0.0001 + llm_betas: + - 0.9 + - 0.95 + llm_eps: 1e-06 + llm_learning_rate: 5e-05 + llm_weight_decay: 0 + metrics_log_interval: 20 + name: adamw + vit_betas: + - 0.9 + - 0.95 + vit_eps: 1e-06 + vit_learning_rate: 6e-06 + vit_weight_decay: 0 + weight_decay: 0.01 +precision: + value: amp_bf16 +python_profiling: + value: false +remote_save_folder: + value: null +reset_dataloader_state: + value: false +reset_optimizer_state: + value: false +reset_trainer_state: + value: false +restore_dataloader: + value: true +run_name: + value: cleandesk50_20251008_163748 +save_dataloader_state: + value: false +save_folder: + value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_l1_regression +save_interval: + value: 500 +save_interval_action_head: + value: 500 +save_interval_ephemeral: + value: null +save_interval_unsharded: + value: 500 +save_num_action_head_checkpoints_to_keep: + value: 2 +save_num_checkpoints_to_keep: + value: 1 +save_num_unsharded_checkpoints_to_keep: + value: 1 +save_overwrite: + value: true +scheduler: + value: + alpha_f: 0.1 + connector_t_warmup: 200 + grad_clip_warmup_factor: null + grad_clip_warmup_steps: null + llm_t_warmup: 2000 + name: multimodal + t_max: null + t_warmup: 100 + units: steps + vit_t_warmup: 2000 + warmup_min_lr: 0 +seed: + value: 6198 +sharded_checkpointer: + value: torch_legacy +softmax_auxiliary_loss: + value: true +softmax_auxiliary_loss_scale: + value: 0.0001 +speed_monitor: + value: + gpu_flops_available: null + window_size: 20 +stop_after: + value: null +stop_at: + value: 500000 +time_limit: + value: null +torch_profiling: + value: false +train_exit_random_layer: + value: false +use_lora: + value: false diff --git a/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/output.log b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/output.log new file mode 100644 index 0000000000000000000000000000000000000000..3389ea3b5f37c61a8c7997169a1ef3ebd97e1251 --- /dev/null +++ b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/output.log @@ -0,0 +1,186 @@ +wandb: Detected [openai] in use. +wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script. +wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/ +10/08 [16:38:33] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk50', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}} +****** Skip RLDS main; path not found: None +****** start build LeRobot main... +build_tokenizer, cache_dir None tokenizer_dir None +10/08 [16:38:35] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130 +10/08 [16:38:36] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:436 +****** before LeRobot dataset... +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk50 +****** length of the dataset: 27906 +10/08 [16:38:38] INFO | >> build_rlds_train_dataset: Loading train dataset: vla_dataset_realworld/train __init__.py:519 +****** Import RLDSBatchTransform, RLDSDataset successfully. +****** before RLDS dataset... +****** data_config.rlds_dataset_name: a1_real_world +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE +214************** + INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 87212/87212 [00:44<00:00, 1952.50it/s] +214************** +10/08 [16:39:27] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/jaco_play/0.1.0/dataset_statistics_e081d4716a3da95df91c79d661ae59fa26a43da49db4bf8d716b622b56 + 3b0ea3.json. +214************** +10/08 [16:39:28] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_cable_routing/0.1.0/dataset_statistics_08cb4c5b7c5e6c035fc84ea85b2d54c0c46ad608a8763 + 4ebb18374088d23cd76.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/viola/0.1.0/dataset_statistics_2415d8f7de73c8761fedd7c2a9590667fb0d3fdd26664bf4c100222e5cdb89 + b9.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_autolab_ur5/0.1.0/dataset_statistics_1b798b015e7b2c4e4396719e3aa4d43a2f400b2edf5dbb0 + 820cb3df6943d8ddc.json. +214************** +10/08 [16:39:29] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_buds_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_ccecde24cc01793b221 + 4eb0c4c5d7cc0e3ccc623db99bd892b83552b20decfb7.json. +214************** + INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 456/456 [00:25<00:00, 17.70it/s] +214************** +10/08 [16:39:57] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 5100/5100 [01:00<00:00, 84.00it/s] +214************** +10/08 [16:41:03] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 240/240 [00:05<00:00, 46.96it/s] +214************** +10/08 [16:41:09] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_sirius_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_cb2e0273f80029a19 + dc3dbb3a3a4118a5598e7bff3ff0245891255825b04b42a.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/dlr_edan_shared_control_converted_externally_to_rlds/0.1.0/dataset_statistics_b8984563fc3e7ea + c0803c667ef58c9deaf2e747683568306ea1d83505d532a76.json. +214************** +10/08 [16:41:10] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 1500/1500 [00:02<00:00, 544.82it/s] +214************** +10/08 [16:41:14] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_fanuc_manipulation/0.1.0/dataset_statistics_a98d349d0364668095ea3ca38c6785e94f35e5e5 + 8e234c88fac83775a923b0d0.json. +214************** +10/08 [16:41:15] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 43264/43264 [00:51<00:00, 836.91it/s] +214************** +10/08 [16:42:10] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/roboturk/0.1.0/dataset_statistics_3aa821e17a2937f941d4102cfadcb1154853cb45dcec07ccc66893b01f6 + f1b40.json. +214************** +10/08 [16:42:11] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/toto/0.1.0/dataset_statistics_505a51eb76e85fe0969e8e70e45fb8c9ae5d3b1fae2851c7899bea91f74b979 + 0.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/ucsd_kitchen_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_1f1a5f310a2d5a6edc + 0e217370e135c8c8598290f11f57025037adcb0d033926.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/iamlab_cmu_pickup_insert_converted_externally_to_rlds/0.1.0/dataset_statistics_698a1f892f8866 + af9cb4bd5a23611fa44d8c7d9d816f9b3049d2fc3b62442079.json. + +###################################################################################### +# Loading the following 18 datasets (incl. sampling weight): # +# fractal20220817_data: ====================================================0.529250 # +# jaco_play: ===============================================================0.010898 # +# berkeley_cable_routing: ==================================================0.005916 # +# viola: ===================================================================0.021337 # +# berkeley_autolab_ur5: ====================================================0.027379 # +# austin_buds_dataset_converted_externally_to_rlds: ========================0.004768 # +# nyu_franka_play_dataset_converted_externally_to_rlds: ====================0.018817 # +# furniture_bench_dataset_converted_externally_to_rlds: ====================0.055185 # +# austin_sailor_dataset_converted_externally_to_rlds: ======================0.049354 # +# austin_sirius_dataset_converted_externally_to_rlds: ======================0.039129 # +# dlr_edan_shared_control_converted_externally_to_rlds: ====================0.001248 # +# utaustin_mutex: ==========================================================0.050583 # +# berkeley_fanuc_manipulation: =============================================0.017504 # +# bc_z: ====================================================================0.168166 # +# roboturk: ================================================================0.000131 # +# toto: ====================================================================0.000228 # +# ucsd_kitchen_dataset_converted_externally_to_rlds: =======================0.000006 # +# iamlab_cmu_pickup_insert_converted_externally_to_rlds: ===================0.000102 # +###################################################################################### + + INFO | >> [*] Threads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:563 + INFO | >> [*] Reads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:564 + INFO | >> [*] Constructing datasets... dataset.py:567 +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +10/08 [16:42:16] INFO | >> [*] Applying frame transforms on dataset... dataset.py:607 +****** after RLDSDataset initialization! +****** length of the dataset: 7154275 +****** Build rlds train dataset: IterableDatasetWrapper successfully. +****** path: None +****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None +****** After build vla train dataset... +****** iterable_sources: [, ] +****** Before build mixed iterable dataset... +****** Build vla train dataloader successfully! +************************* Build train_dataloader successful! +************************* Before build_inf_evaluators +10/08 [16:42:17] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +************************* Build evaluators successful! +************************* Early exit flags: early_exit=False +PROPRIO_DIM 16 does not match ACTION_DIM 16 for AffordVLA +************************* Initialize model successful! +***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt +***** Load checkpoint successful! +missing keys: ['action_head.model.layer_norm1.weight', 'action_head.model.layer_norm1.bias', 'action_head.model.fc1.weight', 'action_head.model.fc1.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.1.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.1.bias', 'action_head.model.layer_norm2.weight', 'action_head.model.layer_norm2.bias', 'action_head.model.fc2.weight', 'action_head.model.fc2.bias', 'proprio_projector.fc1.weight', 'proprio_projector.fc1.bias', 'proprio_projector.fc2.weight', 'proprio_projector.fc2.bias'] +unexpected keys: [] +************************* Initialize model successful! +************************* Before FSDP model wrapping +************************* FSDP model wrapping successful! +************************* Before building optimizer and scheduler +10/08 [16:44:19] INFO | >> Constructing optimizer with 2 param groups optim.py:1283 +************************************************** +After building optimizer and scheduler and model, before training, peak GPU memory (MB): 35614 +************************* VLATrainer initialized successfully! +************************* Before trainer.fit() +Pre-train system metrics + System/Peak GPU Memory (MB)=35,614 +10/08 [16:44:31] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109 + sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor). + timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch] + +!!!Training failed: stack expects each tensor to be equal size, but got [] at entry 0 and [1] at entry 1 +Traceback (most recent call last): + File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 593, in main + trainer.fit() + File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2284, in fit + for batch in self.train_loader: + File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 734, in __next__ + data = self._next_data() + File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 790, in _next_data + data = self._dataset_fetcher.fetch(index) # may raise StopIteration + File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py", line 43, in fetch + return self.collate_fn(data) + File "/vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py", line 201, in __call__ + out['timestep'] = torch.stack(timestep_list, dim=0) +RuntimeError: stack expects each tensor to be equal size, but got [] at entry 0 and [1] at entry 1 +wandb: WARNING The `quiet` argument to `wandb.run.finish()` is deprecated, use `wandb.Settings(quiet=...)` to set this instead. diff --git a/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/requirements.txt b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/requirements.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8 --- /dev/null +++ b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/requirements.txt @@ -0,0 +1,286 @@ +ai2-molmo==0.0.0 +astunparse==1.6.3 +flatbuffers==25.2.10 +gast==0.6.0 +google-pasta==0.2.0 +h5py==3.14.0 +libclang==18.1.1 +Markdown==3.9 +namex==0.1.0 +opt_einsum==3.4.0 +optree==0.17.0 +tensorboard-data-server==0.7.2 +tensorflow-io-gcs-filesystem==0.37.1 +termcolor==3.1.0 +Werkzeug==3.1.3 +Brotli==1.1.0 +Farama-Notifications==0.0.4 +MarkupSafe==2.1.5 +PyYAML==6.0.2 +absl-py==2.3.1 +accelerate==1.10.1 +ai2-molmo==0.0.0 +aiofiles==24.1.0 +aiohappyeyeballs==2.6.1 +aiohttp==3.12.15 +aiosignal==1.4.0 +annotated-types==0.7.0 +antlr4-python3-runtime==4.9.3 +anyio==4.10.0 +array_record==0.8.1 +async-timeout==5.0.1 +attrs==25.3.0 +av==15.1.0 +backports.tarfile==1.2.0 +beaker-gantry==3.2.0 +beaker-py==2.5.0 +black==23.12.1 +blinker==1.9.0 +boltons==25.0.0 +boto3==1.40.33 +botocore==1.40.33 +build==1.3.0 +cached_path==1.7.3 +cached-property==2.0.1 +cachetools==5.5.2 +certifi==2025.8.3 +cffi==2.0.0 +charset-normalizer==3.4.3 +click==8.2.1 +click-help-colors==0.9.4 +click-option-group==0.5.7 +cloudpickle==3.1.1 +cmake==4.1.0 +contourpy==1.3.2 +cryptography==46.0.1 +cycler==0.12.1 +dataclass-extensions==0.2.3 +datasets==3.6.0 +decorator==5.2.1 +deepdiff==8.6.1 +diffusers==0.35.1 +dill==0.3.8 +distro==1.9.0 +dlimp==0.0.1 +dm-tree==0.1.9 +docutils==0.22.1 +draccus==0.10.0 +editdistance==0.8.1 +einops==0.8.1 +einops-exts==0.0.4 +et_xmlfile==2.0.0 +etils==1.13.0 +evdev==1.9.2 +exceptiongroup==1.3.0 +face==24.0.0 +fastapi==0.116.2 +ffmpy==0.6.1 +fiddle==0.3.0 +filelock==3.13.1 +Flask==3.1.2 +fonttools==4.60.0 +frozenlist==1.7.0 +fsspec==2023.9.2 +ftfy==6.3.1 +gcsfs==2023.9.2 +gitdb==4.0.12 +GitPython==3.1.45 +glom==24.11.0 +google-api-core==2.25.1 +google-auth==2.40.3 +google-auth-oauthlib==1.2.2 +google-cloud-core==2.4.3 +google-cloud-storage==2.19.0 +google-crc32c==1.7.1 +google-resumable-media==2.7.2 +googleapis-common-protos==1.70.0 +gradio==5.46.0 +gradio_client==1.13.0 +graphviz==0.21 +groovy==0.1.2 +grpcio==1.75.0 +gymnasium==0.29.1 +h11==0.16.0 +hf_transfer==0.1.9 +hf-xet==1.1.10 +httpcore==1.0.9 +httpx==0.28.1 +huggingface-hub==0.35.0 +id==1.5.0 +idna==3.10 +imageio==2.37.0 +imageio-ffmpeg==0.6.0 +importlib_metadata==8.7.0 +importlib_resources==6.5.2 +iniconfig==2.1.0 +inquirerpy==0.3.4 +isort==5.12.0 +itsdangerous==2.2.0 +jaraco.classes==3.4.0 +jaraco.context==6.0.1 +jaraco.functools==4.3.0 +jeepney==0.9.0 +Jinja2==3.1.4 +jiter==0.11.0 +jmespath==1.0.1 +joblib==1.5.2 +jsonlines==4.0.0 +keras==2.15.0 +keyring==25.6.0 +kiwisolver==1.4.9 +latex2sympy2_extended==1.10.2 +lerobot==0.3.4 +Levenshtein==0.27.1 +libcst==1.8.4 +lightning-utilities==0.15.2 +markdown-it-py==4.0.0 +math-verify==0.8.0 +matplotlib==3.10.6 +mdurl==0.1.2 +mergedeep==1.3.4 +ml-dtypes==0.2.0 +ml_dtypes==0.5.3 +more-itertools==10.8.0 +mpmath==1.3.0 +msgspec==0.19.0 +multidict==6.6.4 +multiprocess==0.70.16 +mypy==1.3.0 +mypy_extensions==1.1.0 +necessary==0.4.3 +networkx==3.3 +nh3==0.3.0 +nltk==3.9.1 +numpy==1.26.4 +oauthlib==3.3.1 +omegaconf==2.3.0 +openai==1.108.0 +opencv-python-headless==4.12.0.88 +OpenEXR==3.4.0 +openpyxl==3.1.5 +orderly-set==5.5.0 +orjson==3.11.3 +packaging==25.0 +pandas==2.3.2 +pathspec==0.12.1 +petname==2.6 +pfzy==0.3.4 +pillow==11.0.0 +pip==25.2 +platformdirs==4.4.0 +pluggy==1.6.0 +promise==2.3 +prompt_toolkit==3.0.52 +propcache==0.3.2 +proto-plus==1.26.1 +protobuf==4.21.12 +protobuf==6.32.1 +psutil==7.1.0 +pyarrow==21.0.0 +pyasn1==0.6.1 +pyasn1_modules==0.4.2 +pycparser==2.23 +pydantic==2.11.9 +pydantic_core==2.33.2 +pydub==0.25.1 +Pygments==2.19.2 +pynput==1.8.1 +pyparsing==3.2.4 +pyproject_hooks==1.2.0 +pyserial==3.5 +pytest==8.4.2 +pytest-sphinx==0.6.3 +python-dateutil==2.9.0.post0 +python-Levenshtein==0.27.1 +python-multipart==0.0.20 +python-xlib==0.33 +pytorch-triton-rocm==3.4.0 +pytz==2025.2 +pyyaml-include==1.4.1 +RapidFuzz==3.14.1 +readme_renderer==44.0 +regex==2025.9.1 +requests==2.32.5 +requests-oauthlib==2.0.0 +requests-toolbelt==1.0.0 +requirements-parser==0.13.0 +rerun-sdk==0.22.1 +rfc3986==2.0.0 +rich==13.9.4 +rsa==4.9.1 +ruff==0.13.0 +s3transfer==0.14.0 +safehttpx==0.1.6 +safetensors==0.6.2 +scikit-learn==1.7.2 +scipy==1.15.3 +SecretStorage==3.4.0 +semantic-version==2.10.0 +sentencepiece==0.2.1 +sentry-sdk==2.38.0 +setuptools==78.1.1 +shellingham==1.5.4 +six==1.17.0 +smart_open==7.3.1 +smashed==0.21.5 +smmap==5.0.2 +sniffio==1.3.1 +starlette==0.48.0 +sympy==1.13.3 +tensorboard==2.15.2 +tensorboard==2.19.0 +tensorflow==2.15.0 +tensorflow-addons==0.23.0 +tensorflow-datasets==4.9.3 +tensorflow-estimator==2.15.0 +tensorflow-graphics==2021.12.3 +tensorflow-metadata==1.17.2 +threadpoolctl==3.6.0 +timm==1.0.19 +tokenizers==0.22.0 +toml==0.10.2 +tomli==2.2.1 +tomlkit==0.13.3 +torch==2.8.0+rocm6.4 +torchcodec==0.5 +torchmetrics==1.8.2 +torchvision==0.23.0+rocm6.4 +tqdm==4.67.1 +transformers==4.56.1 +trimesh==4.8.2 +trouting==0.3.3 +twine==6.2.0 +typeguard==2.13.3 +typer==0.17.4 +typing_extensions==4.15.0 +typing-inspect==0.9.0 +typing-inspection==0.4.1 +tzdata==2025.2 +urllib3==2.5.0 +uvicorn==0.35.0 +wandb==0.21.4 +wcwidth==0.2.13 +websockets==15.0.1 +wheel==0.45.1 +wrapt==1.14.2 +xxhash==3.5.0 +yarl==1.20.1 +zipp==3.23.0 +lerobot==0.3.4 +minLoRA==0.1.0 +autocommand==2.2.2 +backports.tarfile==1.2.0 +importlib_metadata==8.0.0 +inflect==7.3.1 +jaraco.collections==5.1.0 +jaraco.context==5.3.0 +jaraco.functools==4.0.1 +jaraco.text==3.12.1 +more-itertools==10.3.0 +packaging==24.2 +platformdirs==4.2.2 +tomli==2.0.1 +typeguard==4.3.0 +typing_extensions==4.12.2 +wheel==0.45.1 +zipp==3.19.2 diff --git a/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/wandb-metadata.json b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/wandb-metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..4314b8dc34fe9f1cccbc37df4c1fe25f63cefade --- /dev/null +++ b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/wandb-metadata.json @@ -0,0 +1,204 @@ +{ + "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35", + "python": "CPython 3.10.18", + "startedAt": "2025-10-08T16:38:31.458924Z", + "args": [ + "qwen2_7b", + "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_l1_regression", + "--vision_backbone", + "openai", + "--action_head", + "l1_regression", + "--seq_len", + "1600", + "--ft_llm", + "--checkpoint", + "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924", + "--device_train_microbatch_size", + "16", + "--global_batch_size", + "126", + "--dataset", + "vla_dataset_realworld", + "--llm_learning_rate", + "5e-5", + "--wandb_entity", + "henryeap", + "--wandb_project", + "a1-realworld", + "--wandb_run_name", + "cleandesk50", + "--real_world_vla_config_path", + "vla_config_realworld/vla_config_cleandesk50.yaml", + "--save_overwrite" + ], + "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py", + "codePath": "launch_scripts/train_vla.py", + "codePathLocal": "launch_scripts/train_vla.py", + "git": { + "remote": "https://github.com/Spatialtemporal-AI/A1.git", + "commit": "49712a42d21a8c739a16ba5eeaec4a0d7b29ab80" + }, + "email": "ihenrykwok@outlook.com", + "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk50_l1_regression/wandb", + "host": "auh7-1b-gpu-188", + "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10", + "cpu_count": 64, + "cpu_count_logical": 128, + "gpu": "Instinct MI210", + "gpu_count": 8, + "disk": { + "/": { + "total": "470343073792", + "used": "52340371456" + } + }, + "memory": { + "total": "2434606964736" + }, + "gpu_amd": [ + { + "id": "7", + "uniqueId": "0x21a2e88d06c419dc", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "4", + "uniqueId": "0xa515afd8ced1d39d", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "2", + "uniqueId": "0x399226d2b2bfa544", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "6", + "uniqueId": "0xfa8b85a4625b04f", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "3", + "uniqueId": "0xf61ec17df11883bd", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "1", + "uniqueId": "0x9b5c1c302c8129f8", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "0", + "uniqueId": "0x3558c3014c813fdb", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "5", + "uniqueId": "0x137c9ede1bb1518e", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + } + ], + "slurm": { + "cluster_name": "ai-04r", + "conf": "/etc/slurm/slurm.conf", + "cpus_on_node": "128", + "gpus_on_node": "8", + "gtids": "0", + "job_account": "faculty-acc", + "job_cpus_per_node": "128", + "job_end_time": "1760200645", + "job_gid": "2000", + "job_gpus": "0,1,2,3,4,5,6,7", + "job_id": "2284", + "job_name": "mh_cleandesk50_l1_regression", + "job_nodelist": "auh7-1b-gpu-188", + "job_num_nodes": "1", + "job_partition": "faculty", + "job_qos": "xdqos", + "job_start_time": "1759941445", + "job_uid": "2013", + "job_user": "xiaodan", + "jobid": "2284", + "localid": "0", + "nnodes": "1", + "nodeid": "0", + "nodelist": "auh7-1b-gpu-188", + "nprocs": "1", + "ntasks": "1", + "ntasks_per_node": "1", + "oom_kill_step": "0", + "prio_process": "0", + "procid": "0", + "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts", + "submit_host": "auh-1b-cpu-login-001", + "task_pid": "2621518", + "tasks_per_node": "1", + "topology_addr": "auh7-1b-gpu-188", + "topology_addr_pattern": "node" + }, + "writerId": "da16lrefa3ue6fcq4audbkzfio2vskvf" +} \ No newline at end of file diff --git a/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/wandb-summary.json b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/wandb-summary.json new file mode 100644 index 0000000000000000000000000000000000000000..19dd8c75e7658f1e16eeea752065b6189505636a --- /dev/null +++ b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/files/wandb-summary.json @@ -0,0 +1 @@ +{"_step":0,"_wandb":{"runtime":361},"_runtime":361.82454539,"System/Peak GPU Memory (MB)":35614.78125,"_timestamp":1.7599418591639297e+09} \ No newline at end of file diff --git a/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/logs/debug-core.log b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/logs/debug-core.log new file mode 100644 index 0000000000000000000000000000000000000000..45b5ddc2f86290b3379d9ba77c39716b65a5932c --- /dev/null +++ b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/logs/debug-core.log @@ -0,0 +1,16 @@ +{"time":"2025-10-08T16:38:31.69984144Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpzewm22rr/port-2621708.txt","pid":2621708,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false} +{"time":"2025-10-08T16:38:31.702272712Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":2621708} +{"time":"2025-10-08T16:38:31.702674102Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-2621708-2621877-1682313073/socket","Net":"unix"}} +{"time":"2025-10-08T16:38:31.710784598Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"} +{"time":"2025-10-08T16:38:31.724491738Z","level":"INFO","msg":"handleInformInit: received","streamId":"fqdwkc8m","id":"1(@)"} +{"time":"2025-10-08T16:38:33.081443256Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"fqdwkc8m","id":"1(@)"} +{"time":"2025-10-08T16:44:37.411729039Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"fqdwkc8m","id":"1(@)"} +{"time":"2025-10-08T16:44:37.41421139Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"fqdwkc8m","id":"1(@)"} +{"time":"2025-10-08T16:44:37.461669803Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"} +{"time":"2025-10-08T16:44:37.461695793Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"} +{"time":"2025-10-08T16:44:37.461702223Z","level":"INFO","msg":"server is shutting down"} +{"time":"2025-10-08T16:44:37.461709833Z","level":"INFO","msg":"connection: closing","id":"1(@)"} +{"time":"2025-10-08T16:44:37.461743853Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"} +{"time":"2025-10-08T16:44:37.461747193Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"} +{"time":"2025-10-08T16:44:37.461760803Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-2621708-2621877-1682313073/socket","Net":"unix"}} +{"time":"2025-10-08T16:44:37.461786643Z","level":"INFO","msg":"server is closed"} diff --git a/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/logs/debug-internal.log b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/logs/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..66a0fb2bb4c67d7f04a61c0c9f52c0db563747b5 --- /dev/null +++ b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/logs/debug-internal.log @@ -0,0 +1,12 @@ +{"time":"2025-10-08T16:38:31.726288089Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-08T16:38:33.081399086Z","level":"INFO","msg":"stream: created new stream","id":"fqdwkc8m"} +{"time":"2025-10-08T16:38:33.081437966Z","level":"INFO","msg":"stream: started","id":"fqdwkc8m"} +{"time":"2025-10-08T16:38:33.081464946Z","level":"INFO","msg":"sender: started","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:38:33.081464936Z","level":"INFO","msg":"writer: started","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:38:33.081488306Z","level":"INFO","msg":"handler: started","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:44:35.233389442Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"updating run metadata","runtime_seconds":0.00059375}],"total_operations":1}} +{"time":"2025-10-08T16:44:37.058187164Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"} +{"time":"2025-10-08T16:44:37.412033949Z","level":"INFO","msg":"stream: closing","id":"fqdwkc8m"} +{"time":"2025-10-08T16:44:37.412048989Z","level":"INFO","msg":"handler: closed","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:44:37.4130748Z","level":"INFO","msg":"sender: closed","stream_id":"fqdwkc8m"} +{"time":"2025-10-08T16:44:37.41308173Z","level":"INFO","msg":"stream: closed","id":"fqdwkc8m"} diff --git a/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/logs/debug.log b/cleandesk50_l1_regression/wandb/wandb/run-20251008_163831-fqdwkc8m/logs/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/cleandesk_flow_matching/step11500-action-head/metadata.pt b/cleandesk_flow_matching/step11500-action-head/metadata.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e34304d65d6217c2b0a33ee0a75ccecc5e8f82c --- /dev/null +++ b/cleandesk_flow_matching/step11500-action-head/metadata.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb72b6306ce04d1beb20bb289509f00c39a40845ff7c4b36bf4deb4e83fe82a +size 1331 diff --git a/cleandesk_flow_matching/step12000-unsharded/config.yaml b/cleandesk_flow_matching/step12000-unsharded/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..237ca7ca5a155016aae5d937be50254d7ace7f20 --- /dev/null +++ b/cleandesk_flow_matching/step12000-unsharded/config.yaml @@ -0,0 +1,322 @@ +run_name: cleandesk_20251005_163721 +seed: 6198 +epoch: null +dry_run: false +model: + d_model: 3584 + n_heads: 28 + n_kv_heads: 4 + qkv_bias: true + clip_qkv: null + n_layers: 28 + mlp_ratio: 4 + mlp_hidden_size: 37888 + activation_type: swiglu + block_type: sequential + block_group_size: 1 + rope: true + rope_full_precision: true + rope_theta: 1000000.0 + vision_backbone: + image_model_type: openai + image_default_input_size: + - 336 + - 336 + image_patch_size: 14 + image_pos_patch_size: 14 + image_emb_dim: 1024 + image_num_heads: 16 + image_num_key_value_heads: 16 + image_num_layers: 23 + image_head_dim: 64 + image_mlp_dim: 4096 + image_mlp_activations: quick_gelu + image_dropout_rate: 0.0 + image_num_pos: 577 + image_norm_eps: 1.0e-05 + attention_dropout: 0.0 + residual_dropout: 0.0 + initializer_range: 0.02 + fsdp_wrap: false + resize_mode: default + vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt + llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt + low_cpu_fsdp: true + attention_type: sdpa + float32_attention: true + attention_dropout: 0.0 + attention_layer_norm: false + residual_dropout: 0.1 + response_residual_dropout: 0.0 + embedding_dropout: 0.0 + layer_norm_type: rms + layer_norm_with_affine: true + layer_norm_eps: 1.0e-06 + attention_layer_norm_with_affine: true + max_sequence_length: 4096 + max_position_embeddings: null + include_bias: false + bias_for_layer_norm: null + scale_logits: false + vocab_size: 152064 + embedding_size: 152064 + ff_out_size: null + additional_vocab_size: 128 + new_embedding_init_range: 0.02 + weight_tying: false + init_device: null + init_fn: normal + init_std: 0.02 + init_cutoff_factor: null + norm_after: false + precision: amp_bf16 + max_crops: 12 + crop_mode: overlap-and-resize-c2 + use_col_tokens: true + prompt_type: uber_model + system_prompt_kind: demo_or_style + message_formatting: role + always_start_with_space: true + multi_annotation_weighting: root_subsegments + default_inference_len: 65 + overlap_margins: + - 4 + - 4 + pad_value: 0.0 + image_padding_embed: pad_and_partial_pad + fix_image_padding: true + vit_layers: + - -2 + - -9 + image_pooling_h: 2 + image_pooling_w: 2 + image_pooling_2d: attention_meanq + image_projector: mlp + image_feature_dropout: 0.0 + initializer_range: 0.02 + normalize_input_embeds: false + use_position_ids: true + head_dim: null + action_tokenizer: + identifier: physical-intelligence/fast + tokenizer_dir: null + action_dim: 7 + horizon: 8 + tokenizer: + identifier: Qwen/Qwen2-7B + tokenizer_dir: null + pad_tokenizer: true + moe_num_experts: 8 + moe_top_k: 2 + moe_mlp_impl: sparse + moe_log_expert_assignment: false + moe_shared_expert: false + moe_lbl_in_fp32: false + moe_interleave: false + moe_loss_weight: 0.1 + moe_zloss_weight: null + moe_dropless: true + moe_capacity_factor: 1.25 + action_head: flow_matching + num_diffusion_steps: 1000 + num_diffusion_inference_steps: 30 + use_proprio: true + action_head_dit_hidden_size: 1152 + action_head_dit_depth: 28 + action_head_dit_num_heads: 16 + llm_causal_attention: false + action_use_left_eef: true + action_use_mobile_base: false +allow_resume: false +ft_llm: true +ft_vit: false +ft_connector: false +ft_embedding: lm_head +lora: false +use_lora: true +lora_rank: 8 +lora_llm: false +lora_vit: false +lora_connector: false +early_exit: false +train_exit_random_layer: false +optimizer: + name: adamw + learning_rate: 0.0001 + weight_decay: 0.01 + betas: + - 0.9 + - 0.95 + eps: 1.0e-05 + connector_learning_rate: 0.0002 + vit_learning_rate: 6.0e-06 + llm_learning_rate: 5.0e-05 + connector_weight_decay: 0.0 + vit_weight_decay: 0.0 + llm_weight_decay: 0.0 + connector_betas: + - 0.9 + - 0.95 + vit_betas: + - 0.9 + - 0.95 + llm_betas: + - 0.9 + - 0.95 + connector_eps: 1.0e-06 + vit_eps: 1.0e-06 + llm_eps: 1.0e-06 + metrics_log_interval: 20 +scheduler: + name: multimodal + units: steps + t_warmup: 100 + t_max: null + alpha_f: 0.1 + connector_t_warmup: 200 + vit_t_warmup: 2000 + llm_t_warmup: 2000 + grad_clip_warmup_steps: null + grad_clip_warmup_factor: null + warmup_min_lr: 0.0 +data: + dataset: vla_dataset_realworld + mixture: null + root_size_mixture: null + split: train + seed: 95818 + shuffle_messages: false + pad: to_max + sequence_length: 1600 + shuffle: true + for_inference: false + multi_modal: torch + num_workers: 0 + drop_last: true + pin_memory: true + prefetch_factor: null + persistent_workers: false + timeout: 0 + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk + use_wrist_image: true + use_proprio: true + rlds_shuffle_buffer_size: 100000 + rlds_traj_threads: 8 + rlds_read_threads: 8 + lerobot_episode_index_start: null + lerobot_episode_index_end: null +restore_dataloader: true +fast_forward_batches: null +evaluators: +- label: val + data: + dataset: vla_dataset_realworld + mixture: null + root_size_mixture: null + split: validation + seed: null + shuffle_messages: false + pad: to_max + sequence_length: 1600 + shuffle: false + for_inference: false + multi_modal: torch + num_workers: 0 + drop_last: true + pin_memory: true + prefetch_factor: null + persistent_workers: true + timeout: 0 + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + use_wrist_image: true + use_proprio: true + rlds_shuffle_buffer_size: 256000 + rlds_traj_threads: 8 + rlds_read_threads: 8 + lerobot_episode_index_start: 353 + lerobot_episode_index_end: 765 + device_eval_batch_size: null + subset_num_batches: 64 + max_examples: null + max_new_tokens: 448 + mm_evaluator: null + save_dir: null + save_to_checkpoint_dir: false + eval_name: null + skip_if_metrics_cached: true +eval_interval: 0 +inf_eval_interval: -1 +inf_evaluators: [] +save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk_flow_matching +remote_save_folder: null +canceled_check_interval: 50 +save_interval: 500 +save_interval_unsharded: 500 +save_interval_ephemeral: null +save_interval_action_head: 500 +save_num_checkpoints_to_keep: 1 +save_num_unsharded_checkpoints_to_keep: 1 +save_num_action_head_checkpoints_to_keep: 2 +save_overwrite: true +force_save_unsharded: false +no_pre_train_checkpoint: true +initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +load_model_config: null +checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +load_path: null +load_path_sharded_checkpointer: null +reset_optimizer_state: false +reset_trainer_state: false +save_dataloader_state: false +reset_dataloader_state: false +keep_lr_on_load: true +sharded_checkpointer: torch_legacy +max_duration: 500000 +global_train_batch_size: 126 +device_train_batch_size: 15 +device_train_microbatch_size: 16 +device_eval_batch_size: 4 +eval_subset_num_batches: -1 +eval_on_load: false +device_inf_eval_batch_size: 16 +inf_eval_subset_num_batches: -1 +device_train_grad_accum: 0 +max_grad_norm: 1.0 +multi_component_grad_norm: true +batch_divisor: global_batch +max_grad_norm_ratio: null +precision: amp_bf16 +wandb: + project: a1-realworld + entity: henryeap + group: null + name: cleandesk_20251005_163721 + tags: + - watching + log_artifacts: false + rank_zero_only: true + log_interval: 1 +speed_monitor: + window_size: 20 + gpu_flops_available: null +console_log_interval: 1 +gen1_gc_interval: 1 +compile: null +fsdp: + use_orig_params: true + sharding_strategy: FULL_SHARD + wrapping_strategy: by_block_and_size + precision: float + hybrid_sharding_num_model_replicas: null +softmax_auxiliary_loss: true +softmax_auxiliary_loss_scale: 0.0001 +time_limit: null +extra_steps_after_cancel: 10 +python_profiling: false +torch_profiling: false +stop_at: 500000 +stop_after: null +activation_checkpointing: whole_layer +fused_loss: null diff --git a/cleandesk_flow_matching/step12000/config.yaml b/cleandesk_flow_matching/step12000/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..237ca7ca5a155016aae5d937be50254d7ace7f20 --- /dev/null +++ b/cleandesk_flow_matching/step12000/config.yaml @@ -0,0 +1,322 @@ +run_name: cleandesk_20251005_163721 +seed: 6198 +epoch: null +dry_run: false +model: + d_model: 3584 + n_heads: 28 + n_kv_heads: 4 + qkv_bias: true + clip_qkv: null + n_layers: 28 + mlp_ratio: 4 + mlp_hidden_size: 37888 + activation_type: swiglu + block_type: sequential + block_group_size: 1 + rope: true + rope_full_precision: true + rope_theta: 1000000.0 + vision_backbone: + image_model_type: openai + image_default_input_size: + - 336 + - 336 + image_patch_size: 14 + image_pos_patch_size: 14 + image_emb_dim: 1024 + image_num_heads: 16 + image_num_key_value_heads: 16 + image_num_layers: 23 + image_head_dim: 64 + image_mlp_dim: 4096 + image_mlp_activations: quick_gelu + image_dropout_rate: 0.0 + image_num_pos: 577 + image_norm_eps: 1.0e-05 + attention_dropout: 0.0 + residual_dropout: 0.0 + initializer_range: 0.02 + fsdp_wrap: false + resize_mode: default + vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt + llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt + low_cpu_fsdp: true + attention_type: sdpa + float32_attention: true + attention_dropout: 0.0 + attention_layer_norm: false + residual_dropout: 0.1 + response_residual_dropout: 0.0 + embedding_dropout: 0.0 + layer_norm_type: rms + layer_norm_with_affine: true + layer_norm_eps: 1.0e-06 + attention_layer_norm_with_affine: true + max_sequence_length: 4096 + max_position_embeddings: null + include_bias: false + bias_for_layer_norm: null + scale_logits: false + vocab_size: 152064 + embedding_size: 152064 + ff_out_size: null + additional_vocab_size: 128 + new_embedding_init_range: 0.02 + weight_tying: false + init_device: null + init_fn: normal + init_std: 0.02 + init_cutoff_factor: null + norm_after: false + precision: amp_bf16 + max_crops: 12 + crop_mode: overlap-and-resize-c2 + use_col_tokens: true + prompt_type: uber_model + system_prompt_kind: demo_or_style + message_formatting: role + always_start_with_space: true + multi_annotation_weighting: root_subsegments + default_inference_len: 65 + overlap_margins: + - 4 + - 4 + pad_value: 0.0 + image_padding_embed: pad_and_partial_pad + fix_image_padding: true + vit_layers: + - -2 + - -9 + image_pooling_h: 2 + image_pooling_w: 2 + image_pooling_2d: attention_meanq + image_projector: mlp + image_feature_dropout: 0.0 + initializer_range: 0.02 + normalize_input_embeds: false + use_position_ids: true + head_dim: null + action_tokenizer: + identifier: physical-intelligence/fast + tokenizer_dir: null + action_dim: 7 + horizon: 8 + tokenizer: + identifier: Qwen/Qwen2-7B + tokenizer_dir: null + pad_tokenizer: true + moe_num_experts: 8 + moe_top_k: 2 + moe_mlp_impl: sparse + moe_log_expert_assignment: false + moe_shared_expert: false + moe_lbl_in_fp32: false + moe_interleave: false + moe_loss_weight: 0.1 + moe_zloss_weight: null + moe_dropless: true + moe_capacity_factor: 1.25 + action_head: flow_matching + num_diffusion_steps: 1000 + num_diffusion_inference_steps: 30 + use_proprio: true + action_head_dit_hidden_size: 1152 + action_head_dit_depth: 28 + action_head_dit_num_heads: 16 + llm_causal_attention: false + action_use_left_eef: true + action_use_mobile_base: false +allow_resume: false +ft_llm: true +ft_vit: false +ft_connector: false +ft_embedding: lm_head +lora: false +use_lora: true +lora_rank: 8 +lora_llm: false +lora_vit: false +lora_connector: false +early_exit: false +train_exit_random_layer: false +optimizer: + name: adamw + learning_rate: 0.0001 + weight_decay: 0.01 + betas: + - 0.9 + - 0.95 + eps: 1.0e-05 + connector_learning_rate: 0.0002 + vit_learning_rate: 6.0e-06 + llm_learning_rate: 5.0e-05 + connector_weight_decay: 0.0 + vit_weight_decay: 0.0 + llm_weight_decay: 0.0 + connector_betas: + - 0.9 + - 0.95 + vit_betas: + - 0.9 + - 0.95 + llm_betas: + - 0.9 + - 0.95 + connector_eps: 1.0e-06 + vit_eps: 1.0e-06 + llm_eps: 1.0e-06 + metrics_log_interval: 20 +scheduler: + name: multimodal + units: steps + t_warmup: 100 + t_max: null + alpha_f: 0.1 + connector_t_warmup: 200 + vit_t_warmup: 2000 + llm_t_warmup: 2000 + grad_clip_warmup_steps: null + grad_clip_warmup_factor: null + warmup_min_lr: 0.0 +data: + dataset: vla_dataset_realworld + mixture: null + root_size_mixture: null + split: train + seed: 95818 + shuffle_messages: false + pad: to_max + sequence_length: 1600 + shuffle: true + for_inference: false + multi_modal: torch + num_workers: 0 + drop_last: true + pin_memory: true + prefetch_factor: null + persistent_workers: false + timeout: 0 + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk + use_wrist_image: true + use_proprio: true + rlds_shuffle_buffer_size: 100000 + rlds_traj_threads: 8 + rlds_read_threads: 8 + lerobot_episode_index_start: null + lerobot_episode_index_end: null +restore_dataloader: true +fast_forward_batches: null +evaluators: +- label: val + data: + dataset: vla_dataset_realworld + mixture: null + root_size_mixture: null + split: validation + seed: null + shuffle_messages: false + pad: to_max + sequence_length: 1600 + shuffle: false + for_inference: false + multi_modal: torch + num_workers: 0 + drop_last: true + pin_memory: true + prefetch_factor: null + persistent_workers: true + timeout: 0 + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + use_wrist_image: true + use_proprio: true + rlds_shuffle_buffer_size: 256000 + rlds_traj_threads: 8 + rlds_read_threads: 8 + lerobot_episode_index_start: 353 + lerobot_episode_index_end: 765 + device_eval_batch_size: null + subset_num_batches: 64 + max_examples: null + max_new_tokens: 448 + mm_evaluator: null + save_dir: null + save_to_checkpoint_dir: false + eval_name: null + skip_if_metrics_cached: true +eval_interval: 0 +inf_eval_interval: -1 +inf_evaluators: [] +save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk_flow_matching +remote_save_folder: null +canceled_check_interval: 50 +save_interval: 500 +save_interval_unsharded: 500 +save_interval_ephemeral: null +save_interval_action_head: 500 +save_num_checkpoints_to_keep: 1 +save_num_unsharded_checkpoints_to_keep: 1 +save_num_action_head_checkpoints_to_keep: 2 +save_overwrite: true +force_save_unsharded: false +no_pre_train_checkpoint: true +initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +load_model_config: null +checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +load_path: null +load_path_sharded_checkpointer: null +reset_optimizer_state: false +reset_trainer_state: false +save_dataloader_state: false +reset_dataloader_state: false +keep_lr_on_load: true +sharded_checkpointer: torch_legacy +max_duration: 500000 +global_train_batch_size: 126 +device_train_batch_size: 15 +device_train_microbatch_size: 16 +device_eval_batch_size: 4 +eval_subset_num_batches: -1 +eval_on_load: false +device_inf_eval_batch_size: 16 +inf_eval_subset_num_batches: -1 +device_train_grad_accum: 0 +max_grad_norm: 1.0 +multi_component_grad_norm: true +batch_divisor: global_batch +max_grad_norm_ratio: null +precision: amp_bf16 +wandb: + project: a1-realworld + entity: henryeap + group: null + name: cleandesk_20251005_163721 + tags: + - watching + log_artifacts: false + rank_zero_only: true + log_interval: 1 +speed_monitor: + window_size: 20 + gpu_flops_available: null +console_log_interval: 1 +gen1_gc_interval: 1 +compile: null +fsdp: + use_orig_params: true + sharding_strategy: FULL_SHARD + wrapping_strategy: by_block_and_size + precision: float + hybrid_sharding_num_model_replicas: null +softmax_auxiliary_loss: true +softmax_auxiliary_loss_scale: 0.0001 +time_limit: null +extra_steps_after_cancel: 10 +python_profiling: false +torch_profiling: false +stop_at: 500000 +stop_after: null +activation_checkpointing: whole_layer +fused_loss: null diff --git a/cleandesk_flow_matching/wandb/wandb/debug-internal.log b/cleandesk_flow_matching/wandb/wandb/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..1ba7edbb8635596525174158f909fd1d567e371b --- /dev/null +++ b/cleandesk_flow_matching/wandb/wandb/debug-internal.log @@ -0,0 +1,12 @@ +{"time":"2025-10-05T16:38:02.602917026Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-05T16:38:03.762826737Z","level":"INFO","msg":"stream: created new stream","id":"gqyapbwp"} +{"time":"2025-10-05T16:38:03.762885338Z","level":"INFO","msg":"stream: started","id":"gqyapbwp"} +{"time":"2025-10-05T16:38:03.762906828Z","level":"INFO","msg":"writer: started","stream_id":"gqyapbwp"} +{"time":"2025-10-05T16:38:03.762906838Z","level":"INFO","msg":"sender: started","stream_id":"gqyapbwp"} +{"time":"2025-10-05T16:38:03.762920708Z","level":"INFO","msg":"handler: started","stream_id":"gqyapbwp"} +{"time":"2025-10-06T19:04:19.555419176Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"} +{"time":"2025-10-06T20:03:34.950654374Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"} +{"time":"2025-10-07T15:02:38.499153299Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"} +{"time":"2025-10-07T21:28:37.643147942Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-07T22:22:44.986859439Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-07T23:26:33.122893273Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/gqyapbwp/file_stream","body":"\n\n\n502 Server Error\n\n\n

Error: Server Error

\n

The server encountered a temporary error and could not complete your request.

Please try again in 30 seconds.

\n

\n\n"} diff --git a/cleandesk_flow_matching/wandb/wandb/debug.log b/cleandesk_flow_matching/wandb/wandb/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/files/output.log b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/files/output.log new file mode 100644 index 0000000000000000000000000000000000000000..9c84cc65e727fb60866909f1417fbb396e9699c4 --- /dev/null +++ b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/files/output.log @@ -0,0 +1,62656 @@ +wandb: Detected [openai] in use. +wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script. +wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/ +10/05 [16:38:04] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}} +****** Skip RLDS main; path not found: None +****** start build LeRobot main... +build_tokenizer, cache_dir None tokenizer_dir None +10/05 [16:38:06] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130 + INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:435 +****** before LeRobot dataset... +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk +****** length of the dataset: 72641 +****** Skip RLDS open-source-real-world; mixture 'a1_real_world' not found under: /vast/users/xiaodan/zhangjian/datasets/OXE +****** Expect one of: [] +****** path: None +****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None +****** After build vla train dataset... +****** iterable_sources: [] +****** Before build mixed iterable dataset... +****** Build vla train dataloader successfully! +************************* Build train_dataloader successful! +************************* Before build_inf_evaluators +10/05 [16:38:10] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +************************* Build evaluators successful! +************************* Early exit flags: early_exit=False +************************* Initialize model successful! +***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt +***** Load checkpoint successful! +missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_ +unexpected keys: [] +************************* Initialize model successful! +************************* LoRA flags: use_lora=True, lora_llm=False, lora_vit=False, lora_connector=False +************************* Before add lora to model +************************* Before FSDP model wrapping +************************* FSDP model wrapping successful! +************************* Before building optimizer and scheduler +************* Before get lora params +************* After get lora params successfully +10/05 [16:39:41] INFO | >> Constructing optimizer with 2 param groups optim.py:1283 +************************************************** +After building optimizer and scheduler and model, before training, peak GPU memory (MB): 36856 +************************* VLATrainer initialized successfully! +************************* Before trainer.fit() +Pre-train system metrics + System/Peak GPU Memory (MB)=36,856 +10/05 [16:39:42] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109 + sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor). + timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch] + +10/05 [16:39:49] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py:967: UserWarning: The .grad attribute warnings.py:109 + of a Tensor that is not a leaf Tensor is being accessed. Its .grad attribute won't be populated during autograd.backward(). If you indeed + want the .grad field to be populated for a non-leaf Tensor, use .retain_grad() on the non-leaf Tensor. If you access the non-leaf Tensor + by mistake, make sure you access the leaf Tensor instead. See github.com/pytorch/pytorch/pull/30531 for more informations. (Triggered + internally at /pytorch/build/aten/src/ATen/core/TensorBody.h:489.) + param_grad = param.grad + +[step=1/500000] + train/ActionNoiseL2Loss=1.711 + throughput/total_tokens=192,000 + System/Peak GPU Memory (MB)=39,644 +[step=2/500000] + train/ActionNoiseL2Loss=1.698 + throughput/total_tokens=384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,466 +[step=3/500000] + train/ActionNoiseL2Loss=1.651 + throughput/total_tokens=576,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=4/500000] + train/ActionNoiseL2Loss=1.636 + throughput/total_tokens=768,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5/500000] + train/ActionNoiseL2Loss=1.611 + throughput/total_tokens=960,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6/500000] + train/ActionNoiseL2Loss=1.546 + throughput/total_tokens=1,152,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7/500000] + train/ActionNoiseL2Loss=1.419 + throughput/total_tokens=1,344,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8/500000] + train/ActionNoiseL2Loss=1.455 + throughput/total_tokens=1,536,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9/500000] + train/ActionNoiseL2Loss=1.474 + throughput/total_tokens=1,728,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10/500000] + train/ActionNoiseL2Loss=1.361 + throughput/total_tokens=1,920,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,466 +[step=11/500000] + train/ActionNoiseL2Loss=1.384 + throughput/total_tokens=2,112,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=12/500000] + train/ActionNoiseL2Loss=1.290 + throughput/total_tokens=2,304,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=13/500000] + train/ActionNoiseL2Loss=1.316 + throughput/total_tokens=2,496,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=14/500000] + train/ActionNoiseL2Loss=1.381 + throughput/total_tokens=2,688,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=15/500000] + train/ActionNoiseL2Loss=1.237 + throughput/total_tokens=2,880,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=16/500000] + train/ActionNoiseL2Loss=1.354 + throughput/total_tokens=3,072,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=17/500000] + train/ActionNoiseL2Loss=1.300 + throughput/total_tokens=3,264,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=18/500000] + train/ActionNoiseL2Loss=1.377 + throughput/total_tokens=3,456,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=19/500000] + train/ActionNoiseL2Loss=1.326 + throughput/total_tokens=3,648,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=20/500000] + optim/total_grad_norm=19.56 + train/ActionNoiseL2Loss=1.255 + throughput/total_tokens=3,840,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,466 +[step=21/500000] + train/ActionNoiseL2Loss=1.270 + throughput/total_tokens=4,032,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=22/500000] + train/ActionNoiseL2Loss=1.208 + throughput/total_tokens=4,224,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=23/500000] + train/ActionNoiseL2Loss=1.275 + throughput/total_tokens=4,416,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=24/500000] + train/ActionNoiseL2Loss=1.252 + throughput/total_tokens=4,608,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=25/500000] + train/ActionNoiseL2Loss=1.169 + throughput/total_tokens=4,800,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=26/500000] + train/ActionNoiseL2Loss=1.164 + throughput/total_tokens=4,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=27/500000] + train/ActionNoiseL2Loss=1.225 + throughput/total_tokens=5,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=28/500000] + train/ActionNoiseL2Loss=1.149 + throughput/total_tokens=5,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=29/500000] + train/ActionNoiseL2Loss=1.192 + throughput/total_tokens=5,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=30/500000] + train/ActionNoiseL2Loss=1.152 + throughput/total_tokens=5,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=31/500000] + train/ActionNoiseL2Loss=1.007 + throughput/total_tokens=5,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=32/500000] + train/ActionNoiseL2Loss=1.041 + throughput/total_tokens=6,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=33/500000] + train/ActionNoiseL2Loss=1.134 + throughput/total_tokens=6,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=34/500000] + train/ActionNoiseL2Loss=1.046 + throughput/total_tokens=6,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=35/500000] + train/ActionNoiseL2Loss=0.9645 + throughput/total_tokens=6,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=36/500000] + train/ActionNoiseL2Loss=1.108 + throughput/total_tokens=6,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=37/500000] + train/ActionNoiseL2Loss=0.9956 + throughput/total_tokens=7,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=38/500000] + train/ActionNoiseL2Loss=1.090 + throughput/total_tokens=7,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=39/500000] + train/ActionNoiseL2Loss=1.005 + throughput/total_tokens=7,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=40/500000] + optim/total_grad_norm=11.64 + train/ActionNoiseL2Loss=0.9402 + throughput/total_tokens=7,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=41/500000] + train/ActionNoiseL2Loss=0.9616 + throughput/total_tokens=7,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=42/500000] + train/ActionNoiseL2Loss=0.9340 + throughput/total_tokens=8,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=43/500000] + train/ActionNoiseL2Loss=1.007 + throughput/total_tokens=8,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=44/500000] + train/ActionNoiseL2Loss=0.9630 + throughput/total_tokens=8,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=45/500000] + train/ActionNoiseL2Loss=0.9288 + throughput/total_tokens=8,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=46/500000] + train/ActionNoiseL2Loss=0.8423 + throughput/total_tokens=8,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=47/500000] + train/ActionNoiseL2Loss=0.9472 + throughput/total_tokens=9,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=48/500000] + train/ActionNoiseL2Loss=0.9073 + throughput/total_tokens=9,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=49/500000] + train/ActionNoiseL2Loss=0.8192 + throughput/total_tokens=9,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=50/500000] + train/ActionNoiseL2Loss=1.045 + throughput/total_tokens=9,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=51/500000] + train/ActionNoiseL2Loss=0.8495 + throughput/total_tokens=9,792,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=52/500000] + train/ActionNoiseL2Loss=0.8396 + throughput/total_tokens=9,984,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=53/500000] + train/ActionNoiseL2Loss=0.8797 + throughput/total_tokens=10,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=54/500000] + train/ActionNoiseL2Loss=0.9695 + throughput/total_tokens=10,368,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=55/500000] + train/ActionNoiseL2Loss=0.8790 + throughput/total_tokens=10,560,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=56/500000] + train/ActionNoiseL2Loss=0.8322 + throughput/total_tokens=10,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=57/500000] + train/ActionNoiseL2Loss=0.8892 + throughput/total_tokens=10,944,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=58/500000] + train/ActionNoiseL2Loss=0.7627 + throughput/total_tokens=11,136,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=59/500000] + train/ActionNoiseL2Loss=0.9071 + throughput/total_tokens=11,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=60/500000] + optim/total_grad_norm=13.59 + train/ActionNoiseL2Loss=0.6764 + throughput/total_tokens=11,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,466 +[step=61/500000] + train/ActionNoiseL2Loss=0.9854 + throughput/total_tokens=11,712,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=62/500000] + train/ActionNoiseL2Loss=0.7768 + throughput/total_tokens=11,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=63/500000] + train/ActionNoiseL2Loss=0.8755 + throughput/total_tokens=12,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=64/500000] + train/ActionNoiseL2Loss=0.6781 + throughput/total_tokens=12,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=65/500000] + train/ActionNoiseL2Loss=0.8246 + throughput/total_tokens=12,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=66/500000] + train/ActionNoiseL2Loss=0.7637 + throughput/total_tokens=12,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=67/500000] + train/ActionNoiseL2Loss=0.8331 + throughput/total_tokens=12,864,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=68/500000] + train/ActionNoiseL2Loss=0.7053 + throughput/total_tokens=13,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=69/500000] + train/ActionNoiseL2Loss=0.8177 + throughput/total_tokens=13,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=70/500000] + train/ActionNoiseL2Loss=0.7359 + throughput/total_tokens=13,440,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=71/500000] + train/ActionNoiseL2Loss=0.7719 + throughput/total_tokens=13,632,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=72/500000] + train/ActionNoiseL2Loss=0.7529 + throughput/total_tokens=13,824,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=73/500000] + train/ActionNoiseL2Loss=0.6464 + throughput/total_tokens=14,016,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=74/500000] + train/ActionNoiseL2Loss=0.6626 + throughput/total_tokens=14,208,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=75/500000] + train/ActionNoiseL2Loss=0.6951 + throughput/total_tokens=14,400,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=76/500000] + train/ActionNoiseL2Loss=0.7216 + throughput/total_tokens=14,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=77/500000] + train/ActionNoiseL2Loss=0.6879 + throughput/total_tokens=14,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=78/500000] + train/ActionNoiseL2Loss=0.6603 + throughput/total_tokens=14,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=79/500000] + train/ActionNoiseL2Loss=0.6519 + throughput/total_tokens=15,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=80/500000] + optim/total_grad_norm=14.43 + train/ActionNoiseL2Loss=0.6805 + throughput/total_tokens=15,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=81/500000] + train/ActionNoiseL2Loss=0.7405 + throughput/total_tokens=15,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=82/500000] + train/ActionNoiseL2Loss=0.7458 + throughput/total_tokens=15,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=83/500000] + train/ActionNoiseL2Loss=0.6622 + throughput/total_tokens=15,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=84/500000] + train/ActionNoiseL2Loss=0.6817 + throughput/total_tokens=16,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=85/500000] + train/ActionNoiseL2Loss=0.7840 + throughput/total_tokens=16,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=86/500000] + train/ActionNoiseL2Loss=0.5672 + throughput/total_tokens=16,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=87/500000] + train/ActionNoiseL2Loss=0.5946 + throughput/total_tokens=16,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=88/500000] + train/ActionNoiseL2Loss=0.5877 + throughput/total_tokens=16,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=89/500000] + train/ActionNoiseL2Loss=0.7036 + throughput/total_tokens=17,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=90/500000] + train/ActionNoiseL2Loss=0.6358 + throughput/total_tokens=17,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=91/500000] + train/ActionNoiseL2Loss=0.7254 + throughput/total_tokens=17,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=92/500000] + train/ActionNoiseL2Loss=0.6251 + throughput/total_tokens=17,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=93/500000] + train/ActionNoiseL2Loss=0.5787 + throughput/total_tokens=17,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=94/500000] + train/ActionNoiseL2Loss=0.6345 + throughput/total_tokens=18,048,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=95/500000] + train/ActionNoiseL2Loss=0.6270 + throughput/total_tokens=18,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=96/500000] + train/ActionNoiseL2Loss=0.5564 + throughput/total_tokens=18,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=97/500000] + train/ActionNoiseL2Loss=0.4934 + throughput/total_tokens=18,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=98/500000] + train/ActionNoiseL2Loss=0.5975 + throughput/total_tokens=18,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=99/500000] + train/ActionNoiseL2Loss=0.4990 + throughput/total_tokens=19,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=100/500000] + optim/total_grad_norm=13.41 + train/ActionNoiseL2Loss=0.5755 + throughput/total_tokens=19,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=101/500000] + train/ActionNoiseL2Loss=0.5912 + throughput/total_tokens=19,392,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=102/500000] + train/ActionNoiseL2Loss=0.5059 + throughput/total_tokens=19,584,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=103/500000] + train/ActionNoiseL2Loss=0.4413 + throughput/total_tokens=19,776,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=104/500000] + train/ActionNoiseL2Loss=0.4823 + throughput/total_tokens=19,968,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=105/500000] + train/ActionNoiseL2Loss=0.5281 + throughput/total_tokens=20,160,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=106/500000] + train/ActionNoiseL2Loss=0.4404 + throughput/total_tokens=20,352,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=107/500000] + train/ActionNoiseL2Loss=0.5314 + throughput/total_tokens=20,544,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=108/500000] + train/ActionNoiseL2Loss=0.4968 + throughput/total_tokens=20,736,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=109/500000] + train/ActionNoiseL2Loss=0.4409 + throughput/total_tokens=20,928,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=110/500000] + train/ActionNoiseL2Loss=0.3875 + throughput/total_tokens=21,120,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,466 +[step=111/500000] + train/ActionNoiseL2Loss=0.4903 + throughput/total_tokens=21,312,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=112/500000] + train/ActionNoiseL2Loss=0.5794 + throughput/total_tokens=21,504,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=113/500000] + train/ActionNoiseL2Loss=0.4237 + throughput/total_tokens=21,696,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=114/500000] + train/ActionNoiseL2Loss=0.5765 + throughput/total_tokens=21,888,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=115/500000] + train/ActionNoiseL2Loss=0.5300 + throughput/total_tokens=22,080,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=116/500000] + train/ActionNoiseL2Loss=0.4093 + throughput/total_tokens=22,272,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=117/500000] + train/ActionNoiseL2Loss=0.4724 + throughput/total_tokens=22,464,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=118/500000] + train/ActionNoiseL2Loss=0.4987 + throughput/total_tokens=22,656,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=119/500000] + train/ActionNoiseL2Loss=0.4903 + throughput/total_tokens=22,848,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=120/500000] + optim/total_grad_norm=17.07 + train/ActionNoiseL2Loss=0.4504 + throughput/total_tokens=23,040,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=121/500000] + train/ActionNoiseL2Loss=0.4391 + throughput/total_tokens=23,232,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=122/500000] + train/ActionNoiseL2Loss=0.4652 + throughput/total_tokens=23,424,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=123/500000] + train/ActionNoiseL2Loss=0.4927 + throughput/total_tokens=23,616,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=124/500000] + train/ActionNoiseL2Loss=0.4447 + throughput/total_tokens=23,808,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=125/500000] + train/ActionNoiseL2Loss=0.3505 + throughput/total_tokens=24,000,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=126/500000] + train/ActionNoiseL2Loss=0.4723 + throughput/total_tokens=24,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=127/500000] + train/ActionNoiseL2Loss=0.3640 + throughput/total_tokens=24,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=128/500000] + train/ActionNoiseL2Loss=0.5643 + throughput/total_tokens=24,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=129/500000] + train/ActionNoiseL2Loss=0.3519 + throughput/total_tokens=24,768,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=130/500000] + train/ActionNoiseL2Loss=0.3400 + throughput/total_tokens=24,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=131/500000] + train/ActionNoiseL2Loss=0.4919 + throughput/total_tokens=25,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=132/500000] + train/ActionNoiseL2Loss=0.3536 + throughput/total_tokens=25,344,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=133/500000] + train/ActionNoiseL2Loss=0.5535 + throughput/total_tokens=25,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=134/500000] + train/ActionNoiseL2Loss=0.3842 + throughput/total_tokens=25,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=135/500000] + train/ActionNoiseL2Loss=0.4293 + throughput/total_tokens=25,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=136/500000] + train/ActionNoiseL2Loss=0.3861 + throughput/total_tokens=26,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=137/500000] + train/ActionNoiseL2Loss=0.4180 + throughput/total_tokens=26,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=138/500000] + train/ActionNoiseL2Loss=0.4714 + throughput/total_tokens=26,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=139/500000] + train/ActionNoiseL2Loss=0.3852 + throughput/total_tokens=26,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=140/500000] + optim/total_grad_norm=15.81 + train/ActionNoiseL2Loss=0.4274 + throughput/total_tokens=26,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=141/500000] + train/ActionNoiseL2Loss=0.3446 + throughput/total_tokens=27,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=142/500000] + train/ActionNoiseL2Loss=0.3610 + throughput/total_tokens=27,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=143/500000] + train/ActionNoiseL2Loss=0.3833 + throughput/total_tokens=27,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=144/500000] + train/ActionNoiseL2Loss=0.3995 + throughput/total_tokens=27,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=145/500000] + train/ActionNoiseL2Loss=0.4719 + throughput/total_tokens=27,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=146/500000] + train/ActionNoiseL2Loss=0.4369 + throughput/total_tokens=28,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=147/500000] + train/ActionNoiseL2Loss=0.3257 + throughput/total_tokens=28,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=148/500000] + train/ActionNoiseL2Loss=0.2642 + throughput/total_tokens=28,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=149/500000] + train/ActionNoiseL2Loss=0.2961 + throughput/total_tokens=28,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=150/500000] + train/ActionNoiseL2Loss=0.3745 + throughput/total_tokens=28,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=151/500000] + train/ActionNoiseL2Loss=0.3050 + throughput/total_tokens=28,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=152/500000] + train/ActionNoiseL2Loss=0.4770 + throughput/total_tokens=29,184,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=153/500000] + train/ActionNoiseL2Loss=0.4311 + throughput/total_tokens=29,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=154/500000] + train/ActionNoiseL2Loss=0.4234 + throughput/total_tokens=29,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=155/500000] + train/ActionNoiseL2Loss=0.4054 + throughput/total_tokens=29,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=156/500000] + train/ActionNoiseL2Loss=0.3532 + throughput/total_tokens=29,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=157/500000] + train/ActionNoiseL2Loss=0.5509 + throughput/total_tokens=30,144,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=158/500000] + train/ActionNoiseL2Loss=0.3456 + throughput/total_tokens=30,336,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=159/500000] + train/ActionNoiseL2Loss=0.3035 + throughput/total_tokens=30,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=160/500000] + optim/total_grad_norm=16.46 + train/ActionNoiseL2Loss=0.4799 + throughput/total_tokens=30,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,466 +[step=161/500000] + train/ActionNoiseL2Loss=0.4429 + throughput/total_tokens=30,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=162/500000] + train/ActionNoiseL2Loss=0.3135 + throughput/total_tokens=31,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=163/500000] + train/ActionNoiseL2Loss=0.3405 + throughput/total_tokens=31,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=164/500000] + train/ActionNoiseL2Loss=0.3602 + throughput/total_tokens=31,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=165/500000] + train/ActionNoiseL2Loss=0.3595 + throughput/total_tokens=31,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=166/500000] + train/ActionNoiseL2Loss=0.3893 + throughput/total_tokens=31,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=167/500000] + train/ActionNoiseL2Loss=0.2995 + throughput/total_tokens=32,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=168/500000] + train/ActionNoiseL2Loss=0.4231 + throughput/total_tokens=32,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=169/500000] + train/ActionNoiseL2Loss=0.4257 + throughput/total_tokens=32,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=170/500000] + train/ActionNoiseL2Loss=0.3783 + throughput/total_tokens=32,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=171/500000] + train/ActionNoiseL2Loss=0.4183 + throughput/total_tokens=32,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=172/500000] + train/ActionNoiseL2Loss=0.3231 + throughput/total_tokens=33,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=173/500000] + train/ActionNoiseL2Loss=0.3690 + throughput/total_tokens=33,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=174/500000] + train/ActionNoiseL2Loss=0.3955 + throughput/total_tokens=33,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=175/500000] + train/ActionNoiseL2Loss=0.4930 + throughput/total_tokens=33,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=176/500000] + train/ActionNoiseL2Loss=0.2896 + throughput/total_tokens=33,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=177/500000] + train/ActionNoiseL2Loss=0.3874 + throughput/total_tokens=33,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=178/500000] + train/ActionNoiseL2Loss=0.4812 + throughput/total_tokens=34,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=179/500000] + train/ActionNoiseL2Loss=0.4097 + throughput/total_tokens=34,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=180/500000] + optim/total_grad_norm=9.927 + train/ActionNoiseL2Loss=0.2756 + throughput/total_tokens=34,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=181/500000] + train/ActionNoiseL2Loss=0.2985 + throughput/total_tokens=34,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=182/500000] + train/ActionNoiseL2Loss=0.3616 + throughput/total_tokens=34,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=183/500000] + train/ActionNoiseL2Loss=0.3452 + throughput/total_tokens=35,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=184/500000] + train/ActionNoiseL2Loss=0.4194 + throughput/total_tokens=35,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=185/500000] + train/ActionNoiseL2Loss=0.3636 + throughput/total_tokens=35,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=186/500000] + train/ActionNoiseL2Loss=0.3450 + throughput/total_tokens=35,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=187/500000] + train/ActionNoiseL2Loss=0.2394 + throughput/total_tokens=35,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=188/500000] + train/ActionNoiseL2Loss=0.3508 + throughput/total_tokens=36,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=189/500000] + train/ActionNoiseL2Loss=0.4668 + throughput/total_tokens=36,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=190/500000] + train/ActionNoiseL2Loss=0.2431 + throughput/total_tokens=36,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=191/500000] + train/ActionNoiseL2Loss=0.3283 + throughput/total_tokens=36,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=192/500000] + train/ActionNoiseL2Loss=0.2934 + throughput/total_tokens=36,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=193/500000] + train/ActionNoiseL2Loss=0.2510 + throughput/total_tokens=37,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=194/500000] + train/ActionNoiseL2Loss=0.3387 + throughput/total_tokens=37,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=195/500000] + train/ActionNoiseL2Loss=0.3940 + throughput/total_tokens=37,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=196/500000] + train/ActionNoiseL2Loss=0.3173 + throughput/total_tokens=37,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=197/500000] + train/ActionNoiseL2Loss=0.3372 + throughput/total_tokens=37,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=198/500000] + train/ActionNoiseL2Loss=0.2423 + throughput/total_tokens=38,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=199/500000] + train/ActionNoiseL2Loss=0.2778 + throughput/total_tokens=38,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=200/500000] + optim/total_grad_norm=13.85 + train/ActionNoiseL2Loss=0.2841 + throughput/total_tokens=38,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=201/500000] + train/ActionNoiseL2Loss=0.2260 + throughput/total_tokens=38,592,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=202/500000] + train/ActionNoiseL2Loss=0.3997 + throughput/total_tokens=38,784,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=203/500000] + train/ActionNoiseL2Loss=0.2602 + throughput/total_tokens=38,976,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=204/500000] + train/ActionNoiseL2Loss=0.3861 + throughput/total_tokens=39,168,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=205/500000] + train/ActionNoiseL2Loss=0.2941 + throughput/total_tokens=39,360,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=206/500000] + train/ActionNoiseL2Loss=0.2712 + throughput/total_tokens=39,552,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=207/500000] + train/ActionNoiseL2Loss=0.4389 + throughput/total_tokens=39,744,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=208/500000] + train/ActionNoiseL2Loss=0.4427 + throughput/total_tokens=39,936,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=209/500000] + train/ActionNoiseL2Loss=0.4194 + throughput/total_tokens=40,128,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=210/500000] + train/ActionNoiseL2Loss=0.3214 + throughput/total_tokens=40,320,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 + System/Peak GPU Memory (MB)=46,466 +[step=211/500000] + train/ActionNoiseL2Loss=0.4849 + throughput/total_tokens=40,512,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=212/500000] + train/ActionNoiseL2Loss=0.3849 + throughput/total_tokens=40,704,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=213/500000] + train/ActionNoiseL2Loss=0.4382 + throughput/total_tokens=40,896,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=214/500000] + train/ActionNoiseL2Loss=0.2670 + throughput/total_tokens=41,088,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=215/500000] + train/ActionNoiseL2Loss=0.3889 + throughput/total_tokens=41,280,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=216/500000] + train/ActionNoiseL2Loss=0.4537 + throughput/total_tokens=41,472,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=217/500000] + train/ActionNoiseL2Loss=0.2969 + throughput/total_tokens=41,664,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=218/500000] + train/ActionNoiseL2Loss=0.3676 + throughput/total_tokens=41,856,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=219/500000] + train/ActionNoiseL2Loss=0.3395 + throughput/total_tokens=42,048,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=220/500000] + optim/total_grad_norm=16.22 + train/ActionNoiseL2Loss=0.4704 + throughput/total_tokens=42,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=221/500000] + train/ActionNoiseL2Loss=0.2372 + throughput/total_tokens=42,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=222/500000] + train/ActionNoiseL2Loss=0.3106 + throughput/total_tokens=42,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=223/500000] + train/ActionNoiseL2Loss=0.2358 + throughput/total_tokens=42,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=224/500000] + train/ActionNoiseL2Loss=0.2844 + throughput/total_tokens=43,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=225/500000] + train/ActionNoiseL2Loss=0.3418 + throughput/total_tokens=43,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=226/500000] + train/ActionNoiseL2Loss=0.5291 + throughput/total_tokens=43,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=227/500000] + train/ActionNoiseL2Loss=0.3510 + throughput/total_tokens=43,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=228/500000] + train/ActionNoiseL2Loss=0.3234 + throughput/total_tokens=43,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=229/500000] + train/ActionNoiseL2Loss=0.4265 + throughput/total_tokens=43,968,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=230/500000] + train/ActionNoiseL2Loss=0.2657 + throughput/total_tokens=44,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=231/500000] + train/ActionNoiseL2Loss=0.3734 + throughput/total_tokens=44,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=232/500000] + train/ActionNoiseL2Loss=0.2988 + throughput/total_tokens=44,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=233/500000] + train/ActionNoiseL2Loss=0.2802 + throughput/total_tokens=44,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=234/500000] + train/ActionNoiseL2Loss=0.3248 + throughput/total_tokens=44,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=235/500000] + train/ActionNoiseL2Loss=0.3626 + throughput/total_tokens=45,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=236/500000] + train/ActionNoiseL2Loss=0.3620 + throughput/total_tokens=45,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=237/500000] + train/ActionNoiseL2Loss=0.3042 + throughput/total_tokens=45,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=238/500000] + train/ActionNoiseL2Loss=0.2510 + throughput/total_tokens=45,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=239/500000] + train/ActionNoiseL2Loss=0.2635 + throughput/total_tokens=45,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=240/500000] + optim/total_grad_norm=13.75 + train/ActionNoiseL2Loss=0.3792 + throughput/total_tokens=46,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=241/500000] + train/ActionNoiseL2Loss=0.3180 + throughput/total_tokens=46,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=242/500000] + train/ActionNoiseL2Loss=0.3498 + throughput/total_tokens=46,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=243/500000] + train/ActionNoiseL2Loss=0.3461 + throughput/total_tokens=46,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=244/500000] + train/ActionNoiseL2Loss=0.3298 + throughput/total_tokens=46,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=245/500000] + train/ActionNoiseL2Loss=0.3071 + throughput/total_tokens=47,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=246/500000] + train/ActionNoiseL2Loss=0.2733 + throughput/total_tokens=47,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=247/500000] + train/ActionNoiseL2Loss=0.3533 + throughput/total_tokens=47,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=248/500000] + train/ActionNoiseL2Loss=0.2984 + throughput/total_tokens=47,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=249/500000] + train/ActionNoiseL2Loss=0.4127 + throughput/total_tokens=47,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=250/500000] + train/ActionNoiseL2Loss=0.3070 + throughput/total_tokens=48,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=251/500000] + train/ActionNoiseL2Loss=0.2654 + throughput/total_tokens=48,192,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=252/500000] + train/ActionNoiseL2Loss=0.2549 + throughput/total_tokens=48,384,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=253/500000] + train/ActionNoiseL2Loss=0.2911 + throughput/total_tokens=48,576,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=254/500000] + train/ActionNoiseL2Loss=0.2921 + throughput/total_tokens=48,768,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=255/500000] + train/ActionNoiseL2Loss=0.1532 + throughput/total_tokens=48,960,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=256/500000] + train/ActionNoiseL2Loss=0.3352 + throughput/total_tokens=49,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=257/500000] + train/ActionNoiseL2Loss=0.2509 + throughput/total_tokens=49,344,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=258/500000] + train/ActionNoiseL2Loss=0.3001 + throughput/total_tokens=49,536,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=259/500000] + train/ActionNoiseL2Loss=0.3455 + throughput/total_tokens=49,728,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=260/500000] + optim/total_grad_norm=9.711 + train/ActionNoiseL2Loss=0.3442 + throughput/total_tokens=49,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=261/500000] + train/ActionNoiseL2Loss=0.2571 + throughput/total_tokens=50,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=262/500000] + train/ActionNoiseL2Loss=0.2673 + throughput/total_tokens=50,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=263/500000] + train/ActionNoiseL2Loss=0.3115 + throughput/total_tokens=50,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=264/500000] + train/ActionNoiseL2Loss=0.3249 + throughput/total_tokens=50,688,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=265/500000] + train/ActionNoiseL2Loss=0.3502 + throughput/total_tokens=50,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=266/500000] + train/ActionNoiseL2Loss=0.3231 + throughput/total_tokens=51,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=267/500000] + train/ActionNoiseL2Loss=0.2726 + throughput/total_tokens=51,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=268/500000] + train/ActionNoiseL2Loss=0.2623 + throughput/total_tokens=51,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=269/500000] + train/ActionNoiseL2Loss=0.3823 + throughput/total_tokens=51,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=270/500000] + train/ActionNoiseL2Loss=0.3436 + throughput/total_tokens=51,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=271/500000] + train/ActionNoiseL2Loss=0.3678 + throughput/total_tokens=52,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=272/500000] + train/ActionNoiseL2Loss=0.2551 + throughput/total_tokens=52,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=273/500000] + train/ActionNoiseL2Loss=0.3505 + throughput/total_tokens=52,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=274/500000] + train/ActionNoiseL2Loss=0.3095 + throughput/total_tokens=52,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=275/500000] + train/ActionNoiseL2Loss=0.2618 + throughput/total_tokens=52,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=276/500000] + train/ActionNoiseL2Loss=0.2933 + throughput/total_tokens=52,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=277/500000] + train/ActionNoiseL2Loss=0.3200 + throughput/total_tokens=53,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=278/500000] + train/ActionNoiseL2Loss=0.3268 + throughput/total_tokens=53,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=279/500000] + train/ActionNoiseL2Loss=0.3995 + throughput/total_tokens=53,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=280/500000] + optim/total_grad_norm=11.52 + train/ActionNoiseL2Loss=0.3180 + throughput/total_tokens=53,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=281/500000] + train/ActionNoiseL2Loss=0.3418 + throughput/total_tokens=53,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=282/500000] + train/ActionNoiseL2Loss=0.3197 + throughput/total_tokens=54,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=283/500000] + train/ActionNoiseL2Loss=0.3153 + throughput/total_tokens=54,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=284/500000] + train/ActionNoiseL2Loss=0.3524 + throughput/total_tokens=54,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=285/500000] + train/ActionNoiseL2Loss=0.2386 + throughput/total_tokens=54,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=286/500000] + train/ActionNoiseL2Loss=0.3045 + throughput/total_tokens=54,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=287/500000] + train/ActionNoiseL2Loss=0.3050 + throughput/total_tokens=55,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=288/500000] + train/ActionNoiseL2Loss=0.3628 + throughput/total_tokens=55,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=289/500000] + train/ActionNoiseL2Loss=0.3522 + throughput/total_tokens=55,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=290/500000] + train/ActionNoiseL2Loss=0.3040 + throughput/total_tokens=55,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=291/500000] + train/ActionNoiseL2Loss=0.3639 + throughput/total_tokens=55,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=292/500000] + train/ActionNoiseL2Loss=0.2567 + throughput/total_tokens=56,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=293/500000] + train/ActionNoiseL2Loss=0.3460 + throughput/total_tokens=56,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=294/500000] + train/ActionNoiseL2Loss=0.1960 + throughput/total_tokens=56,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=295/500000] + train/ActionNoiseL2Loss=0.1998 + throughput/total_tokens=56,640,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=296/500000] + train/ActionNoiseL2Loss=0.2162 + throughput/total_tokens=56,832,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=297/500000] + train/ActionNoiseL2Loss=0.3420 + throughput/total_tokens=57,024,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=298/500000] + train/ActionNoiseL2Loss=0.3057 + throughput/total_tokens=57,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=299/500000] + train/ActionNoiseL2Loss=0.2186 + throughput/total_tokens=57,408,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=300/500000] + optim/total_grad_norm=12.62 + train/ActionNoiseL2Loss=0.4661 + throughput/total_tokens=57,600,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=301/500000] + train/ActionNoiseL2Loss=0.3187 + throughput/total_tokens=57,792,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=302/500000] + train/ActionNoiseL2Loss=0.2428 + throughput/total_tokens=57,984,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=303/500000] + train/ActionNoiseL2Loss=0.2177 + throughput/total_tokens=58,176,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=304/500000] + train/ActionNoiseL2Loss=0.2455 + throughput/total_tokens=58,368,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=305/500000] + train/ActionNoiseL2Loss=0.5179 + throughput/total_tokens=58,560,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=306/500000] + train/ActionNoiseL2Loss=0.4437 + throughput/total_tokens=58,752,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=307/500000] + train/ActionNoiseL2Loss=0.4490 + throughput/total_tokens=58,944,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=308/500000] + train/ActionNoiseL2Loss=0.4508 + throughput/total_tokens=59,136,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=309/500000] + train/ActionNoiseL2Loss=0.2981 + throughput/total_tokens=59,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=310/500000] + train/ActionNoiseL2Loss=0.3215 + throughput/total_tokens=59,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,466 +[step=311/500000] + train/ActionNoiseL2Loss=0.3350 + throughput/total_tokens=59,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=312/500000] + train/ActionNoiseL2Loss=0.3001 + throughput/total_tokens=59,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=313/500000] + train/ActionNoiseL2Loss=0.3536 + throughput/total_tokens=60,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=314/500000] + train/ActionNoiseL2Loss=0.2445 + throughput/total_tokens=60,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=315/500000] + train/ActionNoiseL2Loss=0.2404 + throughput/total_tokens=60,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=316/500000] + train/ActionNoiseL2Loss=0.1943 + throughput/total_tokens=60,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=317/500000] + train/ActionNoiseL2Loss=0.2762 + throughput/total_tokens=60,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=318/500000] + train/ActionNoiseL2Loss=0.2686 + throughput/total_tokens=61,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=319/500000] + train/ActionNoiseL2Loss=0.3041 + throughput/total_tokens=61,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=320/500000] + optim/total_grad_norm=7.028 + train/ActionNoiseL2Loss=0.2336 + throughput/total_tokens=61,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,466 +[step=321/500000] + train/ActionNoiseL2Loss=0.2920 + throughput/total_tokens=61,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=322/500000] + train/ActionNoiseL2Loss=0.4140 + throughput/total_tokens=61,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=323/500000] + train/ActionNoiseL2Loss=0.3569 + throughput/total_tokens=62,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=324/500000] + train/ActionNoiseL2Loss=0.2087 + throughput/total_tokens=62,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=325/500000] + train/ActionNoiseL2Loss=0.3807 + throughput/total_tokens=62,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=326/500000] + train/ActionNoiseL2Loss=0.2785 + throughput/total_tokens=62,592,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=327/500000] + train/ActionNoiseL2Loss=0.3256 + throughput/total_tokens=62,784,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=328/500000] + train/ActionNoiseL2Loss=0.3356 + throughput/total_tokens=62,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=329/500000] + train/ActionNoiseL2Loss=0.2529 + throughput/total_tokens=63,168,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=330/500000] + train/ActionNoiseL2Loss=0.4011 + throughput/total_tokens=63,360,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,466 +[step=331/500000] + train/ActionNoiseL2Loss=0.2357 + throughput/total_tokens=63,552,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=332/500000] + train/ActionNoiseL2Loss=0.2525 + throughput/total_tokens=63,744,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=333/500000] + train/ActionNoiseL2Loss=0.2431 + throughput/total_tokens=63,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=334/500000] + train/ActionNoiseL2Loss=0.3120 + throughput/total_tokens=64,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=335/500000] + train/ActionNoiseL2Loss=0.2144 + throughput/total_tokens=64,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=336/500000] + train/ActionNoiseL2Loss=0.1972 + throughput/total_tokens=64,512,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=337/500000] + train/ActionNoiseL2Loss=0.3537 + throughput/total_tokens=64,704,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=338/500000] + train/ActionNoiseL2Loss=0.4004 + throughput/total_tokens=64,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=339/500000] + train/ActionNoiseL2Loss=0.3390 + throughput/total_tokens=65,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=340/500000] + optim/total_grad_norm=7.133 + train/ActionNoiseL2Loss=0.2351 + throughput/total_tokens=65,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=341/500000] + train/ActionNoiseL2Loss=0.3299 + throughput/total_tokens=65,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=342/500000] + train/ActionNoiseL2Loss=0.3317 + throughput/total_tokens=65,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=343/500000] + train/ActionNoiseL2Loss=0.2557 + throughput/total_tokens=65,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=344/500000] + train/ActionNoiseL2Loss=0.1977 + throughput/total_tokens=66,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=345/500000] + train/ActionNoiseL2Loss=0.4197 + throughput/total_tokens=66,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=346/500000] + train/ActionNoiseL2Loss=0.2155 + throughput/total_tokens=66,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=347/500000] + train/ActionNoiseL2Loss=0.1730 + throughput/total_tokens=66,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=348/500000] + train/ActionNoiseL2Loss=0.2363 + throughput/total_tokens=66,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=349/500000] + train/ActionNoiseL2Loss=0.4767 + throughput/total_tokens=67,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=350/500000] + train/ActionNoiseL2Loss=0.2365 + throughput/total_tokens=67,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=351/500000] + train/ActionNoiseL2Loss=0.3061 + throughput/total_tokens=67,392,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=352/500000] + train/ActionNoiseL2Loss=0.2718 + throughput/total_tokens=67,584,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=353/500000] + train/ActionNoiseL2Loss=0.2815 + throughput/total_tokens=67,776,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=354/500000] + train/ActionNoiseL2Loss=0.2393 + throughput/total_tokens=67,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=355/500000] + train/ActionNoiseL2Loss=0.3487 + throughput/total_tokens=68,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=356/500000] + train/ActionNoiseL2Loss=0.3844 + throughput/total_tokens=68,352,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=357/500000] + train/ActionNoiseL2Loss=0.3247 + throughput/total_tokens=68,544,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=358/500000] + train/ActionNoiseL2Loss=0.3342 + throughput/total_tokens=68,736,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=359/500000] + train/ActionNoiseL2Loss=0.2114 + throughput/total_tokens=68,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=360/500000] + optim/total_grad_norm=9.202 + train/ActionNoiseL2Loss=0.2267 + throughput/total_tokens=69,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,466 +[step=361/500000] + train/ActionNoiseL2Loss=0.2105 + throughput/total_tokens=69,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=362/500000] + train/ActionNoiseL2Loss=0.4571 + throughput/total_tokens=69,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=363/500000] + train/ActionNoiseL2Loss=0.2843 + throughput/total_tokens=69,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=364/500000] + train/ActionNoiseL2Loss=0.3466 + throughput/total_tokens=69,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=365/500000] + train/ActionNoiseL2Loss=0.3181 + throughput/total_tokens=70,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=366/500000] + train/ActionNoiseL2Loss=0.2644 + throughput/total_tokens=70,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=367/500000] + train/ActionNoiseL2Loss=0.3030 + throughput/total_tokens=70,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=368/500000] + train/ActionNoiseL2Loss=0.2316 + throughput/total_tokens=70,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=369/500000] + train/ActionNoiseL2Loss=0.2234 + throughput/total_tokens=70,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=370/500000] + train/ActionNoiseL2Loss=0.2448 + throughput/total_tokens=71,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=371/500000] + train/ActionNoiseL2Loss=0.2694 + throughput/total_tokens=71,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=372/500000] + train/ActionNoiseL2Loss=0.2434 + throughput/total_tokens=71,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=373/500000] + train/ActionNoiseL2Loss=0.2161 + throughput/total_tokens=71,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=374/500000] + train/ActionNoiseL2Loss=0.3969 + throughput/total_tokens=71,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=375/500000] + train/ActionNoiseL2Loss=0.2917 + throughput/total_tokens=72,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=376/500000] + train/ActionNoiseL2Loss=0.2661 + throughput/total_tokens=72,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=377/500000] + train/ActionNoiseL2Loss=0.3134 + throughput/total_tokens=72,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=378/500000] + train/ActionNoiseL2Loss=0.2537 + throughput/total_tokens=72,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=379/500000] + train/ActionNoiseL2Loss=0.2826 + throughput/total_tokens=72,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=380/500000] + optim/total_grad_norm=7.719 + train/ActionNoiseL2Loss=0.2282 + throughput/total_tokens=72,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=381/500000] + train/ActionNoiseL2Loss=0.1667 + throughput/total_tokens=73,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=382/500000] + train/ActionNoiseL2Loss=0.1876 + throughput/total_tokens=73,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=383/500000] + train/ActionNoiseL2Loss=0.4317 + throughput/total_tokens=73,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=384/500000] + train/ActionNoiseL2Loss=0.2940 + throughput/total_tokens=73,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=385/500000] + train/ActionNoiseL2Loss=0.2537 + throughput/total_tokens=73,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=386/500000] + train/ActionNoiseL2Loss=0.3490 + throughput/total_tokens=74,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=387/500000] + train/ActionNoiseL2Loss=0.3129 + throughput/total_tokens=74,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=388/500000] + train/ActionNoiseL2Loss=0.2908 + throughput/total_tokens=74,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=389/500000] + train/ActionNoiseL2Loss=0.2492 + throughput/total_tokens=74,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=390/500000] + train/ActionNoiseL2Loss=0.1712 + throughput/total_tokens=74,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=391/500000] + train/ActionNoiseL2Loss=0.4088 + throughput/total_tokens=75,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=392/500000] + train/ActionNoiseL2Loss=0.3243 + throughput/total_tokens=75,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=393/500000] + train/ActionNoiseL2Loss=0.3172 + throughput/total_tokens=75,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=394/500000] + train/ActionNoiseL2Loss=0.2903 + throughput/total_tokens=75,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=395/500000] + train/ActionNoiseL2Loss=0.3074 + throughput/total_tokens=75,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=396/500000] + train/ActionNoiseL2Loss=0.2387 + throughput/total_tokens=76,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=397/500000] + train/ActionNoiseL2Loss=0.3237 + throughput/total_tokens=76,224,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=398/500000] + train/ActionNoiseL2Loss=0.2034 + throughput/total_tokens=76,416,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=399/500000] + train/ActionNoiseL2Loss=0.2288 + throughput/total_tokens=76,608,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=400/500000] + optim/total_grad_norm=7.945 + train/ActionNoiseL2Loss=0.2459 + throughput/total_tokens=76,800,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=401/500000] + train/ActionNoiseL2Loss=0.2159 + throughput/total_tokens=76,992,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=402/500000] + train/ActionNoiseL2Loss=0.1778 + throughput/total_tokens=77,184,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=403/500000] + train/ActionNoiseL2Loss=0.1946 + throughput/total_tokens=77,376,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=404/500000] + train/ActionNoiseL2Loss=0.2782 + throughput/total_tokens=77,568,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=405/500000] + train/ActionNoiseL2Loss=0.2074 + throughput/total_tokens=77,760,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=406/500000] + train/ActionNoiseL2Loss=0.1906 + throughput/total_tokens=77,952,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=407/500000] + train/ActionNoiseL2Loss=0.2324 + throughput/total_tokens=78,144,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=408/500000] + train/ActionNoiseL2Loss=0.1978 + throughput/total_tokens=78,336,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=409/500000] + train/ActionNoiseL2Loss=0.2839 + throughput/total_tokens=78,528,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=410/500000] + train/ActionNoiseL2Loss=0.3131 + throughput/total_tokens=78,720,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,466 +[step=411/500000] + train/ActionNoiseL2Loss=0.2657 + throughput/total_tokens=78,912,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=412/500000] + train/ActionNoiseL2Loss=0.3146 + throughput/total_tokens=79,104,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=413/500000] + train/ActionNoiseL2Loss=0.3510 + throughput/total_tokens=79,296,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=414/500000] + train/ActionNoiseL2Loss=0.2556 + throughput/total_tokens=79,488,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=415/500000] + train/ActionNoiseL2Loss=0.2458 + throughput/total_tokens=79,680,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=416/500000] + train/ActionNoiseL2Loss=0.3135 + throughput/total_tokens=79,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=417/500000] + train/ActionNoiseL2Loss=0.2128 + throughput/total_tokens=80,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=418/500000] + train/ActionNoiseL2Loss=0.1872 + throughput/total_tokens=80,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=419/500000] + train/ActionNoiseL2Loss=0.3437 + throughput/total_tokens=80,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=420/500000] + optim/total_grad_norm=8.653 + train/ActionNoiseL2Loss=0.3326 + throughput/total_tokens=80,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=421/500000] + train/ActionNoiseL2Loss=0.3532 + throughput/total_tokens=80,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=422/500000] + train/ActionNoiseL2Loss=0.2250 + throughput/total_tokens=81,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=423/500000] + train/ActionNoiseL2Loss=0.2724 + throughput/total_tokens=81,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=424/500000] + train/ActionNoiseL2Loss=0.1755 + throughput/total_tokens=81,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=425/500000] + train/ActionNoiseL2Loss=0.3186 + throughput/total_tokens=81,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=426/500000] + train/ActionNoiseL2Loss=0.2134 + throughput/total_tokens=81,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=427/500000] + train/ActionNoiseL2Loss=0.2484 + throughput/total_tokens=81,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=428/500000] + train/ActionNoiseL2Loss=0.2241 + throughput/total_tokens=82,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=429/500000] + train/ActionNoiseL2Loss=0.3050 + throughput/total_tokens=82,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=430/500000] + train/ActionNoiseL2Loss=0.1886 + throughput/total_tokens=82,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=431/500000] + train/ActionNoiseL2Loss=0.2840 + throughput/total_tokens=82,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=432/500000] + train/ActionNoiseL2Loss=0.2117 + throughput/total_tokens=82,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=433/500000] + train/ActionNoiseL2Loss=0.2651 + throughput/total_tokens=83,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=434/500000] + train/ActionNoiseL2Loss=0.1964 + throughput/total_tokens=83,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=435/500000] + train/ActionNoiseL2Loss=0.2252 + throughput/total_tokens=83,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=436/500000] + train/ActionNoiseL2Loss=0.2299 + throughput/total_tokens=83,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=437/500000] + train/ActionNoiseL2Loss=0.3338 + throughput/total_tokens=83,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=438/500000] + train/ActionNoiseL2Loss=0.2241 + throughput/total_tokens=84,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=439/500000] + train/ActionNoiseL2Loss=0.2351 + throughput/total_tokens=84,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=440/500000] + optim/total_grad_norm=6.954 + train/ActionNoiseL2Loss=0.1992 + throughput/total_tokens=84,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=441/500000] + train/ActionNoiseL2Loss=0.2223 + throughput/total_tokens=84,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=442/500000] + train/ActionNoiseL2Loss=0.2667 + throughput/total_tokens=84,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=443/500000] + train/ActionNoiseL2Loss=0.2470 + throughput/total_tokens=85,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=444/500000] + train/ActionNoiseL2Loss=0.2799 + throughput/total_tokens=85,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=445/500000] + train/ActionNoiseL2Loss=0.2792 + throughput/total_tokens=85,440,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=446/500000] + train/ActionNoiseL2Loss=0.1877 + throughput/total_tokens=85,632,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=447/500000] + train/ActionNoiseL2Loss=0.2279 + throughput/total_tokens=85,824,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=448/500000] + train/ActionNoiseL2Loss=0.2338 + throughput/total_tokens=86,016,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=449/500000] + train/ActionNoiseL2Loss=0.2011 + throughput/total_tokens=86,208,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=450/500000] + train/ActionNoiseL2Loss=0.2114 + throughput/total_tokens=86,400,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,466 +[step=451/500000] + train/ActionNoiseL2Loss=0.3511 + throughput/total_tokens=86,592,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=452/500000] + train/ActionNoiseL2Loss=0.3130 + throughput/total_tokens=86,784,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=453/500000] + train/ActionNoiseL2Loss=0.4503 + throughput/total_tokens=86,976,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=454/500000] + train/ActionNoiseL2Loss=0.2319 + throughput/total_tokens=87,168,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=455/500000] + train/ActionNoiseL2Loss=0.3364 + throughput/total_tokens=87,360,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=456/500000] + train/ActionNoiseL2Loss=0.3524 + throughput/total_tokens=87,552,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=457/500000] + train/ActionNoiseL2Loss=0.2780 + throughput/total_tokens=87,744,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=458/500000] + train/ActionNoiseL2Loss=0.2519 + throughput/total_tokens=87,936,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=459/500000] + train/ActionNoiseL2Loss=0.1482 + throughput/total_tokens=88,128,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=460/500000] + optim/total_grad_norm=9.562 + train/ActionNoiseL2Loss=0.2558 + throughput/total_tokens=88,320,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,466 +[step=461/500000] + train/ActionNoiseL2Loss=0.2768 + throughput/total_tokens=88,512,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=462/500000] + train/ActionNoiseL2Loss=0.3391 + throughput/total_tokens=88,704,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=463/500000] + train/ActionNoiseL2Loss=0.2612 + throughput/total_tokens=88,896,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=464/500000] + train/ActionNoiseL2Loss=0.2583 + throughput/total_tokens=89,088,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=465/500000] + train/ActionNoiseL2Loss=0.2252 + throughput/total_tokens=89,280,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=466/500000] + train/ActionNoiseL2Loss=0.2174 + throughput/total_tokens=89,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=467/500000] + train/ActionNoiseL2Loss=0.2611 + throughput/total_tokens=89,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=468/500000] + train/ActionNoiseL2Loss=0.3451 + throughput/total_tokens=89,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=469/500000] + train/ActionNoiseL2Loss=0.1988 + throughput/total_tokens=90,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=470/500000] + train/ActionNoiseL2Loss=0.2812 + throughput/total_tokens=90,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=471/500000] + train/ActionNoiseL2Loss=0.1575 + throughput/total_tokens=90,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=472/500000] + train/ActionNoiseL2Loss=0.1825 + throughput/total_tokens=90,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=473/500000] + train/ActionNoiseL2Loss=0.2531 + throughput/total_tokens=90,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=474/500000] + train/ActionNoiseL2Loss=0.2280 + throughput/total_tokens=91,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=475/500000] + train/ActionNoiseL2Loss=0.2182 + throughput/total_tokens=91,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=476/500000] + train/ActionNoiseL2Loss=0.2411 + throughput/total_tokens=91,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=477/500000] + train/ActionNoiseL2Loss=0.2682 + throughput/total_tokens=91,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=478/500000] + train/ActionNoiseL2Loss=0.1944 + throughput/total_tokens=91,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=479/500000] + train/ActionNoiseL2Loss=0.2605 + throughput/total_tokens=91,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=480/500000] + optim/total_grad_norm=7.446 + train/ActionNoiseL2Loss=0.2277 + throughput/total_tokens=92,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=481/500000] + train/ActionNoiseL2Loss=0.2777 + throughput/total_tokens=92,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=482/500000] + train/ActionNoiseL2Loss=0.2285 + throughput/total_tokens=92,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=483/500000] + train/ActionNoiseL2Loss=0.2805 + throughput/total_tokens=92,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=484/500000] + train/ActionNoiseL2Loss=0.2262 + throughput/total_tokens=92,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=485/500000] + train/ActionNoiseL2Loss=0.2389 + throughput/total_tokens=93,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=486/500000] + train/ActionNoiseL2Loss=0.1982 + throughput/total_tokens=93,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=487/500000] + train/ActionNoiseL2Loss=0.2714 + throughput/total_tokens=93,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=488/500000] + train/ActionNoiseL2Loss=0.1825 + throughput/total_tokens=93,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=489/500000] + train/ActionNoiseL2Loss=0.1989 + throughput/total_tokens=93,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=490/500000] + train/ActionNoiseL2Loss=0.2287 + throughput/total_tokens=94,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +[step=491/500000] + train/ActionNoiseL2Loss=0.2095 + throughput/total_tokens=94,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=492/500000] + train/ActionNoiseL2Loss=0.2352 + throughput/total_tokens=94,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=493/500000] + train/ActionNoiseL2Loss=0.1997 + throughput/total_tokens=94,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=494/500000] + train/ActionNoiseL2Loss=0.2190 + throughput/total_tokens=94,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=495/500000] + train/ActionNoiseL2Loss=0.2444 + throughput/total_tokens=95,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=496/500000] + train/ActionNoiseL2Loss=0.3683 + throughput/total_tokens=95,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=497/500000] + train/ActionNoiseL2Loss=0.1889 + throughput/total_tokens=95,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=498/500000] + train/ActionNoiseL2Loss=0.2876 + throughput/total_tokens=95,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=499/500000] + train/ActionNoiseL2Loss=0.2136 + throughput/total_tokens=95,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=500/500000] + optim/total_grad_norm=7.262 + train/ActionNoiseL2Loss=0.1928 + throughput/total_tokens=96,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,466 +10/05 [19:34:25] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: warnings.py:109 + FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and + set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc: + https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial: + https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html . + warnings.warn( + + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:860: UserWarning: warnings.py:109 + `_get_pg_default_device` will be deprecated, it only stays for backward-compatiblity reason. If you need to find a device for object + collectives, please use `_get_object_coll_device`. If you need to query the device types supported by group, please use + `_device_capability(group)`. + warnings.warn( + +10/05 [19:34:27] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:722: FutureWarning: warnings.py:109 + Please use DTensor instead and we are deprecating ShardedTensor. + local_shape = tensor.shape + + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:739: FutureWarning: warnings.py:109 + Please use DTensor instead and we are deprecating ShardedTensor. + tensor.shape, + + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:741: FutureWarning: warnings.py:109 + Please use DTensor instead and we are deprecating ShardedTensor. + tensor.dtype, + +10/05 [19:34:32] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/overrides.py:1747: FutureWarning: Please use DTensor warnings.py:109 + instead and we are deprecating ShardedTensor. + result = torch_func_method(public_api, types, args, kwargs) + +10/05 [19:35:04] INFO | >> Saving config... checkpoint.py:608 +10/05 [19:35:41] INFO | >> Saving model state... checkpoint.py:796 +10/05 [19:36:53] INFO | >> Saving optim state... checkpoint.py:811 +10/05 [19:38:23] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=501/500000] + train/ActionNoiseL2Loss=0.2087 + throughput/total_tokens=96,192,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=502/500000] + train/ActionNoiseL2Loss=0.2182 + throughput/total_tokens=96,384,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=503/500000] + train/ActionNoiseL2Loss=0.3199 + throughput/total_tokens=96,576,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=504/500000] + train/ActionNoiseL2Loss=0.3780 + throughput/total_tokens=96,768,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=505/500000] + train/ActionNoiseL2Loss=0.2367 + throughput/total_tokens=96,960,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=506/500000] + train/ActionNoiseL2Loss=0.2166 + throughput/total_tokens=97,152,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=507/500000] + train/ActionNoiseL2Loss=0.1862 + throughput/total_tokens=97,344,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=508/500000] + train/ActionNoiseL2Loss=0.2666 + throughput/total_tokens=97,536,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=509/500000] + train/ActionNoiseL2Loss=0.2350 + throughput/total_tokens=97,728,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=510/500000] + train/ActionNoiseL2Loss=0.2894 + throughput/total_tokens=97,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=511/500000] + train/ActionNoiseL2Loss=0.3362 + throughput/total_tokens=98,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=512/500000] + train/ActionNoiseL2Loss=0.3625 + throughput/total_tokens=98,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=513/500000] + train/ActionNoiseL2Loss=0.2234 + throughput/total_tokens=98,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=514/500000] + train/ActionNoiseL2Loss=0.1961 + throughput/total_tokens=98,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=515/500000] + train/ActionNoiseL2Loss=0.2494 + throughput/total_tokens=98,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=516/500000] + train/ActionNoiseL2Loss=0.2212 + throughput/total_tokens=99,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=517/500000] + train/ActionNoiseL2Loss=0.1903 + throughput/total_tokens=99,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=518/500000] + train/ActionNoiseL2Loss=0.2033 + throughput/total_tokens=99,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=519/500000] + train/ActionNoiseL2Loss=0.4027 + throughput/total_tokens=99,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=520/500000] + optim/total_grad_norm=8.057 + train/ActionNoiseL2Loss=0.1778 + throughput/total_tokens=99,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=521/500000] + train/ActionNoiseL2Loss=0.2908 + throughput/total_tokens=100,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=522/500000] + train/ActionNoiseL2Loss=0.2126 + throughput/total_tokens=100,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=523/500000] + train/ActionNoiseL2Loss=0.2133 + throughput/total_tokens=100,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=524/500000] + train/ActionNoiseL2Loss=0.3874 + throughput/total_tokens=100,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=525/500000] + train/ActionNoiseL2Loss=0.3500 + throughput/total_tokens=100,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=526/500000] + train/ActionNoiseL2Loss=0.2474 + throughput/total_tokens=100,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=527/500000] + train/ActionNoiseL2Loss=0.2846 + throughput/total_tokens=101,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=528/500000] + train/ActionNoiseL2Loss=0.1513 + throughput/total_tokens=101,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=529/500000] + train/ActionNoiseL2Loss=0.2118 + throughput/total_tokens=101,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=530/500000] + train/ActionNoiseL2Loss=0.3152 + throughput/total_tokens=101,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=531/500000] + train/ActionNoiseL2Loss=0.2043 + throughput/total_tokens=101,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=532/500000] + train/ActionNoiseL2Loss=0.2872 + throughput/total_tokens=102,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=533/500000] + train/ActionNoiseL2Loss=0.4214 + throughput/total_tokens=102,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=534/500000] + train/ActionNoiseL2Loss=0.2577 + throughput/total_tokens=102,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=535/500000] + train/ActionNoiseL2Loss=0.2693 + throughput/total_tokens=102,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=536/500000] + train/ActionNoiseL2Loss=0.2697 + throughput/total_tokens=102,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=537/500000] + train/ActionNoiseL2Loss=0.3796 + throughput/total_tokens=103,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=538/500000] + train/ActionNoiseL2Loss=0.3139 + throughput/total_tokens=103,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=539/500000] + train/ActionNoiseL2Loss=0.2533 + throughput/total_tokens=103,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=540/500000] + optim/total_grad_norm=5.801 + train/ActionNoiseL2Loss=0.1729 + throughput/total_tokens=103,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=541/500000] + train/ActionNoiseL2Loss=0.2041 + throughput/total_tokens=103,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=542/500000] + train/ActionNoiseL2Loss=0.1949 + throughput/total_tokens=104,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=543/500000] + train/ActionNoiseL2Loss=0.1801 + throughput/total_tokens=104,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=544/500000] + train/ActionNoiseL2Loss=0.2227 + throughput/total_tokens=104,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=545/500000] + train/ActionNoiseL2Loss=0.2091 + throughput/total_tokens=104,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=546/500000] + train/ActionNoiseL2Loss=0.1788 + throughput/total_tokens=104,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=547/500000] + train/ActionNoiseL2Loss=0.1479 + throughput/total_tokens=105,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=548/500000] + train/ActionNoiseL2Loss=0.1914 + throughput/total_tokens=105,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=549/500000] + train/ActionNoiseL2Loss=0.1918 + throughput/total_tokens=105,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=550/500000] + train/ActionNoiseL2Loss=0.3560 + throughput/total_tokens=105,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=551/500000] + train/ActionNoiseL2Loss=0.2625 + throughput/total_tokens=105,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=552/500000] + train/ActionNoiseL2Loss=0.1931 + throughput/total_tokens=105,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=553/500000] + train/ActionNoiseL2Loss=0.1305 + throughput/total_tokens=106,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=554/500000] + train/ActionNoiseL2Loss=0.2568 + throughput/total_tokens=106,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=555/500000] + train/ActionNoiseL2Loss=0.3253 + throughput/total_tokens=106,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=556/500000] + train/ActionNoiseL2Loss=0.2456 + throughput/total_tokens=106,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=557/500000] + train/ActionNoiseL2Loss=0.2416 + throughput/total_tokens=106,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=558/500000] + train/ActionNoiseL2Loss=0.2683 + throughput/total_tokens=107,136,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=559/500000] + train/ActionNoiseL2Loss=0.2818 + throughput/total_tokens=107,328,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=560/500000] + optim/total_grad_norm=6.614 + train/ActionNoiseL2Loss=0.1825 + throughput/total_tokens=107,520,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=561/500000] + train/ActionNoiseL2Loss=0.3026 + throughput/total_tokens=107,712,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=562/500000] + train/ActionNoiseL2Loss=0.2234 + throughput/total_tokens=107,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=563/500000] + train/ActionNoiseL2Loss=0.2577 + throughput/total_tokens=108,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=564/500000] + train/ActionNoiseL2Loss=0.2086 + throughput/total_tokens=108,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=565/500000] + train/ActionNoiseL2Loss=0.2015 + throughput/total_tokens=108,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=566/500000] + train/ActionNoiseL2Loss=0.2031 + throughput/total_tokens=108,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=567/500000] + train/ActionNoiseL2Loss=0.1854 + throughput/total_tokens=108,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=568/500000] + train/ActionNoiseL2Loss=0.2938 + throughput/total_tokens=109,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=569/500000] + train/ActionNoiseL2Loss=0.1913 + throughput/total_tokens=109,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=570/500000] + train/ActionNoiseL2Loss=0.2308 + throughput/total_tokens=109,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=571/500000] + train/ActionNoiseL2Loss=0.2375 + throughput/total_tokens=109,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=572/500000] + train/ActionNoiseL2Loss=0.1750 + throughput/total_tokens=109,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=573/500000] + train/ActionNoiseL2Loss=0.1828 + throughput/total_tokens=110,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=574/500000] + train/ActionNoiseL2Loss=0.1597 + throughput/total_tokens=110,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=575/500000] + train/ActionNoiseL2Loss=0.2161 + throughput/total_tokens=110,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=576/500000] + train/ActionNoiseL2Loss=0.1511 + throughput/total_tokens=110,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=577/500000] + train/ActionNoiseL2Loss=0.1903 + throughput/total_tokens=110,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=578/500000] + train/ActionNoiseL2Loss=0.1500 + throughput/total_tokens=110,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=579/500000] + train/ActionNoiseL2Loss=0.2779 + throughput/total_tokens=111,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=580/500000] + optim/total_grad_norm=10.31 + train/ActionNoiseL2Loss=0.3828 + throughput/total_tokens=111,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=581/500000] + train/ActionNoiseL2Loss=0.4160 + throughput/total_tokens=111,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=582/500000] + train/ActionNoiseL2Loss=0.1780 + throughput/total_tokens=111,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=583/500000] + train/ActionNoiseL2Loss=0.1737 + throughput/total_tokens=111,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=584/500000] + train/ActionNoiseL2Loss=0.2419 + throughput/total_tokens=112,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=585/500000] + train/ActionNoiseL2Loss=0.1905 + throughput/total_tokens=112,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=586/500000] + train/ActionNoiseL2Loss=0.1940 + throughput/total_tokens=112,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=587/500000] + train/ActionNoiseL2Loss=0.2068 + throughput/total_tokens=112,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=588/500000] + train/ActionNoiseL2Loss=0.3299 + throughput/total_tokens=112,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=589/500000] + train/ActionNoiseL2Loss=0.4491 + throughput/total_tokens=113,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=590/500000] + train/ActionNoiseL2Loss=0.2864 + throughput/total_tokens=113,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=591/500000] + train/ActionNoiseL2Loss=0.1557 + throughput/total_tokens=113,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=592/500000] + train/ActionNoiseL2Loss=0.2365 + throughput/total_tokens=113,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=593/500000] + train/ActionNoiseL2Loss=0.2681 + throughput/total_tokens=113,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=594/500000] + train/ActionNoiseL2Loss=0.2475 + throughput/total_tokens=114,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=595/500000] + train/ActionNoiseL2Loss=0.2745 + throughput/total_tokens=114,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=596/500000] + train/ActionNoiseL2Loss=0.2442 + throughput/total_tokens=114,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=597/500000] + train/ActionNoiseL2Loss=0.2429 + throughput/total_tokens=114,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=598/500000] + train/ActionNoiseL2Loss=0.1290 + throughput/total_tokens=114,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=599/500000] + train/ActionNoiseL2Loss=0.2431 + throughput/total_tokens=115,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=600/500000] + optim/total_grad_norm=6.195 + train/ActionNoiseL2Loss=0.1877 + throughput/total_tokens=115,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=601/500000] + train/ActionNoiseL2Loss=0.3260 + throughput/total_tokens=115,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=602/500000] + train/ActionNoiseL2Loss=0.3196 + throughput/total_tokens=115,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=603/500000] + train/ActionNoiseL2Loss=0.1442 + throughput/total_tokens=115,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=604/500000] + train/ActionNoiseL2Loss=0.2325 + throughput/total_tokens=115,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=605/500000] + train/ActionNoiseL2Loss=0.2136 + throughput/total_tokens=116,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=606/500000] + train/ActionNoiseL2Loss=0.1767 + throughput/total_tokens=116,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=607/500000] + train/ActionNoiseL2Loss=0.2378 + throughput/total_tokens=116,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=608/500000] + train/ActionNoiseL2Loss=0.1626 + throughput/total_tokens=116,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=609/500000] + train/ActionNoiseL2Loss=0.2717 + throughput/total_tokens=116,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=610/500000] + train/ActionNoiseL2Loss=0.2069 + throughput/total_tokens=117,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,467 +[step=611/500000] + train/ActionNoiseL2Loss=0.2057 + throughput/total_tokens=117,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=612/500000] + train/ActionNoiseL2Loss=0.2490 + throughput/total_tokens=117,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=613/500000] + train/ActionNoiseL2Loss=0.2048 + throughput/total_tokens=117,696,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=614/500000] + train/ActionNoiseL2Loss=0.1657 + throughput/total_tokens=117,888,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=615/500000] + train/ActionNoiseL2Loss=0.2599 + throughput/total_tokens=118,080,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=616/500000] + train/ActionNoiseL2Loss=0.2653 + throughput/total_tokens=118,272,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=617/500000] + train/ActionNoiseL2Loss=0.2059 + throughput/total_tokens=118,464,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=618/500000] + train/ActionNoiseL2Loss=0.2019 + throughput/total_tokens=118,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=619/500000] + train/ActionNoiseL2Loss=0.3406 + throughput/total_tokens=118,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=620/500000] + optim/total_grad_norm=6.753 + train/ActionNoiseL2Loss=0.1745 + throughput/total_tokens=119,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=621/500000] + train/ActionNoiseL2Loss=0.2017 + throughput/total_tokens=119,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=622/500000] + train/ActionNoiseL2Loss=0.2571 + throughput/total_tokens=119,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=623/500000] + train/ActionNoiseL2Loss=0.2342 + throughput/total_tokens=119,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=624/500000] + train/ActionNoiseL2Loss=0.1705 + throughput/total_tokens=119,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=625/500000] + train/ActionNoiseL2Loss=0.2380 + throughput/total_tokens=120,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=626/500000] + train/ActionNoiseL2Loss=0.1745 + throughput/total_tokens=120,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=627/500000] + train/ActionNoiseL2Loss=0.2209 + throughput/total_tokens=120,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=628/500000] + train/ActionNoiseL2Loss=0.3372 + throughput/total_tokens=120,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=629/500000] + train/ActionNoiseL2Loss=0.2650 + throughput/total_tokens=120,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=630/500000] + train/ActionNoiseL2Loss=0.2507 + throughput/total_tokens=120,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=631/500000] + train/ActionNoiseL2Loss=0.1582 + throughput/total_tokens=121,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=632/500000] + train/ActionNoiseL2Loss=0.3464 + throughput/total_tokens=121,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=633/500000] + train/ActionNoiseL2Loss=0.1375 + throughput/total_tokens=121,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=634/500000] + train/ActionNoiseL2Loss=0.2557 + throughput/total_tokens=121,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=635/500000] + train/ActionNoiseL2Loss=0.2243 + throughput/total_tokens=121,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=636/500000] + train/ActionNoiseL2Loss=0.3021 + throughput/total_tokens=122,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=637/500000] + train/ActionNoiseL2Loss=0.1932 + throughput/total_tokens=122,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=638/500000] + train/ActionNoiseL2Loss=0.3245 + throughput/total_tokens=122,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=639/500000] + train/ActionNoiseL2Loss=0.1926 + throughput/total_tokens=122,688,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=640/500000] + optim/total_grad_norm=6.008 + train/ActionNoiseL2Loss=0.1857 + throughput/total_tokens=122,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=641/500000] + train/ActionNoiseL2Loss=0.2739 + throughput/total_tokens=123,072,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=642/500000] + train/ActionNoiseL2Loss=0.2305 + throughput/total_tokens=123,264,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=643/500000] + train/ActionNoiseL2Loss=0.1972 + throughput/total_tokens=123,456,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=644/500000] + train/ActionNoiseL2Loss=0.2669 + throughput/total_tokens=123,648,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=645/500000] + train/ActionNoiseL2Loss=0.2052 + throughput/total_tokens=123,840,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=646/500000] + train/ActionNoiseL2Loss=0.1829 + throughput/total_tokens=124,032,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=647/500000] + train/ActionNoiseL2Loss=0.1391 + throughput/total_tokens=124,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=648/500000] + train/ActionNoiseL2Loss=0.1947 + throughput/total_tokens=124,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=649/500000] + train/ActionNoiseL2Loss=0.2332 + throughput/total_tokens=124,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=650/500000] + train/ActionNoiseL2Loss=0.1859 + throughput/total_tokens=124,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=651/500000] + train/ActionNoiseL2Loss=0.1478 + throughput/total_tokens=124,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=652/500000] + train/ActionNoiseL2Loss=0.1474 + throughput/total_tokens=125,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=653/500000] + train/ActionNoiseL2Loss=0.1595 + throughput/total_tokens=125,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=654/500000] + train/ActionNoiseL2Loss=0.1788 + throughput/total_tokens=125,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=655/500000] + train/ActionNoiseL2Loss=0.1729 + throughput/total_tokens=125,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=656/500000] + train/ActionNoiseL2Loss=0.1576 + throughput/total_tokens=125,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=657/500000] + train/ActionNoiseL2Loss=0.1463 + throughput/total_tokens=126,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=658/500000] + train/ActionNoiseL2Loss=0.2035 + throughput/total_tokens=126,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=659/500000] + train/ActionNoiseL2Loss=0.1840 + throughput/total_tokens=126,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=660/500000] + optim/total_grad_norm=11.01 + train/ActionNoiseL2Loss=0.3446 + throughput/total_tokens=126,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,467 +[step=661/500000] + train/ActionNoiseL2Loss=0.2969 + throughput/total_tokens=126,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=662/500000] + train/ActionNoiseL2Loss=0.1515 + throughput/total_tokens=127,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=663/500000] + train/ActionNoiseL2Loss=0.1857 + throughput/total_tokens=127,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=664/500000] + train/ActionNoiseL2Loss=0.3233 + throughput/total_tokens=127,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=665/500000] + train/ActionNoiseL2Loss=0.3120 + throughput/total_tokens=127,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=666/500000] + train/ActionNoiseL2Loss=0.2170 + throughput/total_tokens=127,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=667/500000] + train/ActionNoiseL2Loss=0.3312 + throughput/total_tokens=128,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=668/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=128,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=669/500000] + train/ActionNoiseL2Loss=0.2204 + throughput/total_tokens=128,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=670/500000] + train/ActionNoiseL2Loss=0.2014 + throughput/total_tokens=128,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=671/500000] + train/ActionNoiseL2Loss=0.1878 + throughput/total_tokens=128,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=672/500000] + train/ActionNoiseL2Loss=0.1793 + throughput/total_tokens=129,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=673/500000] + train/ActionNoiseL2Loss=0.1834 + throughput/total_tokens=129,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=674/500000] + train/ActionNoiseL2Loss=0.1973 + throughput/total_tokens=129,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=675/500000] + train/ActionNoiseL2Loss=0.2031 + throughput/total_tokens=129,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=676/500000] + train/ActionNoiseL2Loss=0.1928 + throughput/total_tokens=129,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=677/500000] + train/ActionNoiseL2Loss=0.1547 + throughput/total_tokens=129,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=678/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=130,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=679/500000] + train/ActionNoiseL2Loss=0.1775 + throughput/total_tokens=130,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=680/500000] + optim/total_grad_norm=9.193 + train/ActionNoiseL2Loss=0.3125 + throughput/total_tokens=130,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=681/500000] + train/ActionNoiseL2Loss=0.2979 + throughput/total_tokens=130,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=682/500000] + train/ActionNoiseL2Loss=0.2696 + throughput/total_tokens=130,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=683/500000] + train/ActionNoiseL2Loss=0.1810 + throughput/total_tokens=131,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=684/500000] + train/ActionNoiseL2Loss=0.2743 + throughput/total_tokens=131,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=685/500000] + train/ActionNoiseL2Loss=0.1870 + throughput/total_tokens=131,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=686/500000] + train/ActionNoiseL2Loss=0.2027 + throughput/total_tokens=131,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=687/500000] + train/ActionNoiseL2Loss=0.1459 + throughput/total_tokens=131,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=688/500000] + train/ActionNoiseL2Loss=0.2159 + throughput/total_tokens=132,096,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=689/500000] + train/ActionNoiseL2Loss=0.1948 + throughput/total_tokens=132,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=690/500000] + train/ActionNoiseL2Loss=0.3235 + throughput/total_tokens=132,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=691/500000] + train/ActionNoiseL2Loss=0.1680 + throughput/total_tokens=132,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=692/500000] + train/ActionNoiseL2Loss=0.2157 + throughput/total_tokens=132,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=693/500000] + train/ActionNoiseL2Loss=0.3897 + throughput/total_tokens=133,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=694/500000] + train/ActionNoiseL2Loss=0.1432 + throughput/total_tokens=133,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=695/500000] + train/ActionNoiseL2Loss=0.1356 + throughput/total_tokens=133,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=696/500000] + train/ActionNoiseL2Loss=0.3117 + throughput/total_tokens=133,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=697/500000] + train/ActionNoiseL2Loss=0.2154 + throughput/total_tokens=133,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=698/500000] + train/ActionNoiseL2Loss=0.1696 + throughput/total_tokens=134,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=699/500000] + train/ActionNoiseL2Loss=0.1958 + throughput/total_tokens=134,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=700/500000] + optim/total_grad_norm=5.386 + train/ActionNoiseL2Loss=0.1812 + throughput/total_tokens=134,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=701/500000] + train/ActionNoiseL2Loss=0.1815 + throughput/total_tokens=134,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=702/500000] + train/ActionNoiseL2Loss=0.2197 + throughput/total_tokens=134,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=703/500000] + train/ActionNoiseL2Loss=0.1800 + throughput/total_tokens=134,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=704/500000] + train/ActionNoiseL2Loss=0.2079 + throughput/total_tokens=135,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=705/500000] + train/ActionNoiseL2Loss=0.2086 + throughput/total_tokens=135,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=706/500000] + train/ActionNoiseL2Loss=0.1530 + throughput/total_tokens=135,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=707/500000] + train/ActionNoiseL2Loss=0.2076 + throughput/total_tokens=135,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=708/500000] + train/ActionNoiseL2Loss=0.2414 + throughput/total_tokens=135,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=709/500000] + train/ActionNoiseL2Loss=0.2028 + throughput/total_tokens=136,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=710/500000] + train/ActionNoiseL2Loss=0.2627 + throughput/total_tokens=136,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,467 +[step=711/500000] + train/ActionNoiseL2Loss=0.1471 + throughput/total_tokens=136,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=712/500000] + train/ActionNoiseL2Loss=0.1326 + throughput/total_tokens=136,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=713/500000] + train/ActionNoiseL2Loss=0.2678 + throughput/total_tokens=136,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=714/500000] + train/ActionNoiseL2Loss=0.1930 + throughput/total_tokens=137,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=715/500000] + train/ActionNoiseL2Loss=0.2094 + throughput/total_tokens=137,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=716/500000] + train/ActionNoiseL2Loss=0.1695 + throughput/total_tokens=137,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=717/500000] + train/ActionNoiseL2Loss=0.1769 + throughput/total_tokens=137,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=718/500000] + train/ActionNoiseL2Loss=0.2401 + throughput/total_tokens=137,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=719/500000] + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=138,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=720/500000] + optim/total_grad_norm=6.126 + train/ActionNoiseL2Loss=0.2335 + throughput/total_tokens=138,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=721/500000] + train/ActionNoiseL2Loss=0.1847 + throughput/total_tokens=138,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=722/500000] + train/ActionNoiseL2Loss=0.1593 + throughput/total_tokens=138,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=723/500000] + train/ActionNoiseL2Loss=0.2462 + throughput/total_tokens=138,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=724/500000] + train/ActionNoiseL2Loss=0.1724 + throughput/total_tokens=139,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=725/500000] + train/ActionNoiseL2Loss=0.1466 + throughput/total_tokens=139,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=726/500000] + train/ActionNoiseL2Loss=0.1556 + throughput/total_tokens=139,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=727/500000] + train/ActionNoiseL2Loss=0.2558 + throughput/total_tokens=139,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=728/500000] + train/ActionNoiseL2Loss=0.2288 + throughput/total_tokens=139,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=729/500000] + train/ActionNoiseL2Loss=0.2122 + throughput/total_tokens=139,968,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=730/500000] + train/ActionNoiseL2Loss=0.1784 + throughput/total_tokens=140,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=731/500000] + train/ActionNoiseL2Loss=0.1478 + throughput/total_tokens=140,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=732/500000] + train/ActionNoiseL2Loss=0.1795 + throughput/total_tokens=140,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=733/500000] + train/ActionNoiseL2Loss=0.2208 + throughput/total_tokens=140,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=734/500000] + train/ActionNoiseL2Loss=0.2184 + throughput/total_tokens=140,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=735/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=141,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=736/500000] + train/ActionNoiseL2Loss=0.1177 + throughput/total_tokens=141,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=737/500000] + train/ActionNoiseL2Loss=0.1888 + throughput/total_tokens=141,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=738/500000] + train/ActionNoiseL2Loss=0.1454 + throughput/total_tokens=141,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=739/500000] + train/ActionNoiseL2Loss=0.2052 + throughput/total_tokens=141,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=740/500000] + optim/total_grad_norm=6.828 + train/ActionNoiseL2Loss=0.2135 + throughput/total_tokens=142,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=741/500000] + train/ActionNoiseL2Loss=0.2759 + throughput/total_tokens=142,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=742/500000] + train/ActionNoiseL2Loss=0.1680 + throughput/total_tokens=142,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=743/500000] + train/ActionNoiseL2Loss=0.1824 + throughput/total_tokens=142,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=744/500000] + train/ActionNoiseL2Loss=0.1678 + throughput/total_tokens=142,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=745/500000] + train/ActionNoiseL2Loss=0.1289 + throughput/total_tokens=143,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=746/500000] + train/ActionNoiseL2Loss=0.1573 + throughput/total_tokens=143,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=747/500000] + train/ActionNoiseL2Loss=0.1985 + throughput/total_tokens=143,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=748/500000] + train/ActionNoiseL2Loss=0.1855 + throughput/total_tokens=143,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=749/500000] + train/ActionNoiseL2Loss=0.1628 + throughput/total_tokens=143,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=750/500000] + train/ActionNoiseL2Loss=0.1845 + throughput/total_tokens=144,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=751/500000] + train/ActionNoiseL2Loss=0.5426 + throughput/total_tokens=144,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=752/500000] + train/ActionNoiseL2Loss=0.2420 + throughput/total_tokens=144,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=753/500000] + train/ActionNoiseL2Loss=0.2260 + throughput/total_tokens=144,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=754/500000] + train/ActionNoiseL2Loss=0.1558 + throughput/total_tokens=144,768,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=755/500000] + train/ActionNoiseL2Loss=0.1615 + throughput/total_tokens=144,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=756/500000] + train/ActionNoiseL2Loss=0.2147 + throughput/total_tokens=145,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=757/500000] + train/ActionNoiseL2Loss=0.1896 + throughput/total_tokens=145,344,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=758/500000] + train/ActionNoiseL2Loss=0.1276 + throughput/total_tokens=145,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=759/500000] + train/ActionNoiseL2Loss=0.1408 + throughput/total_tokens=145,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=760/500000] + optim/total_grad_norm=10.05 + train/ActionNoiseL2Loss=0.3849 + throughput/total_tokens=145,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,467 +[step=761/500000] + train/ActionNoiseL2Loss=0.1555 + throughput/total_tokens=146,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=762/500000] + train/ActionNoiseL2Loss=0.2844 + throughput/total_tokens=146,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=763/500000] + train/ActionNoiseL2Loss=0.2017 + throughput/total_tokens=146,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=764/500000] + train/ActionNoiseL2Loss=0.1835 + throughput/total_tokens=146,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=765/500000] + train/ActionNoiseL2Loss=0.1843 + throughput/total_tokens=146,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=766/500000] + train/ActionNoiseL2Loss=0.2072 + throughput/total_tokens=147,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=767/500000] + train/ActionNoiseL2Loss=0.1739 + throughput/total_tokens=147,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=768/500000] + train/ActionNoiseL2Loss=0.2129 + throughput/total_tokens=147,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=769/500000] + train/ActionNoiseL2Loss=0.2075 + throughput/total_tokens=147,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=770/500000] + train/ActionNoiseL2Loss=0.2944 + throughput/total_tokens=147,840,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=771/500000] + train/ActionNoiseL2Loss=0.2198 + throughput/total_tokens=148,032,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=772/500000] + train/ActionNoiseL2Loss=0.1625 + throughput/total_tokens=148,224,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=773/500000] + train/ActionNoiseL2Loss=0.2044 + throughput/total_tokens=148,416,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=774/500000] + train/ActionNoiseL2Loss=0.1584 + throughput/total_tokens=148,608,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=775/500000] + train/ActionNoiseL2Loss=0.1491 + throughput/total_tokens=148,800,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=776/500000] + train/ActionNoiseL2Loss=0.2922 + throughput/total_tokens=148,992,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=777/500000] + train/ActionNoiseL2Loss=0.2013 + throughput/total_tokens=149,184,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=778/500000] + train/ActionNoiseL2Loss=0.2546 + throughput/total_tokens=149,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=779/500000] + train/ActionNoiseL2Loss=0.2688 + throughput/total_tokens=149,568,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=780/500000] + optim/total_grad_norm=8.487 + train/ActionNoiseL2Loss=0.3384 + throughput/total_tokens=149,760,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=781/500000] + train/ActionNoiseL2Loss=0.1542 + throughput/total_tokens=149,952,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=782/500000] + train/ActionNoiseL2Loss=0.2334 + throughput/total_tokens=150,144,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=783/500000] + train/ActionNoiseL2Loss=0.1761 + throughput/total_tokens=150,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=784/500000] + train/ActionNoiseL2Loss=0.1988 + throughput/total_tokens=150,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=785/500000] + train/ActionNoiseL2Loss=0.1637 + throughput/total_tokens=150,720,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=786/500000] + train/ActionNoiseL2Loss=0.1710 + throughput/total_tokens=150,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=787/500000] + train/ActionNoiseL2Loss=0.2409 + throughput/total_tokens=151,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=788/500000] + train/ActionNoiseL2Loss=0.1470 + throughput/total_tokens=151,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=789/500000] + train/ActionNoiseL2Loss=0.1976 + throughput/total_tokens=151,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=790/500000] + train/ActionNoiseL2Loss=0.1870 + throughput/total_tokens=151,680,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=791/500000] + train/ActionNoiseL2Loss=0.2446 + throughput/total_tokens=151,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=792/500000] + train/ActionNoiseL2Loss=0.1475 + throughput/total_tokens=152,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=793/500000] + train/ActionNoiseL2Loss=0.1728 + throughput/total_tokens=152,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=794/500000] + train/ActionNoiseL2Loss=0.2579 + throughput/total_tokens=152,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=795/500000] + train/ActionNoiseL2Loss=0.1409 + throughput/total_tokens=152,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=796/500000] + train/ActionNoiseL2Loss=0.3345 + throughput/total_tokens=152,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=797/500000] + train/ActionNoiseL2Loss=0.1412 + throughput/total_tokens=153,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=798/500000] + train/ActionNoiseL2Loss=0.1426 + throughput/total_tokens=153,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=799/500000] + train/ActionNoiseL2Loss=0.2317 + throughput/total_tokens=153,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=800/500000] + optim/total_grad_norm=5.194 + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=153,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=801/500000] + train/ActionNoiseL2Loss=0.2143 + throughput/total_tokens=153,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=802/500000] + train/ActionNoiseL2Loss=0.1647 + throughput/total_tokens=153,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=803/500000] + train/ActionNoiseL2Loss=0.1551 + throughput/total_tokens=154,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=804/500000] + train/ActionNoiseL2Loss=0.1388 + throughput/total_tokens=154,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=805/500000] + train/ActionNoiseL2Loss=0.1441 + throughput/total_tokens=154,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=806/500000] + train/ActionNoiseL2Loss=0.1597 + throughput/total_tokens=154,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=807/500000] + train/ActionNoiseL2Loss=0.1895 + throughput/total_tokens=154,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=808/500000] + train/ActionNoiseL2Loss=0.1377 + throughput/total_tokens=155,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=809/500000] + train/ActionNoiseL2Loss=0.1565 + throughput/total_tokens=155,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=810/500000] + train/ActionNoiseL2Loss=0.1339 + throughput/total_tokens=155,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,467 +[step=811/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=155,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=812/500000] + train/ActionNoiseL2Loss=0.2694 + throughput/total_tokens=155,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=813/500000] + train/ActionNoiseL2Loss=0.2150 + throughput/total_tokens=156,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=814/500000] + train/ActionNoiseL2Loss=0.1281 + throughput/total_tokens=156,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=815/500000] + train/ActionNoiseL2Loss=0.1304 + throughput/total_tokens=156,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=816/500000] + train/ActionNoiseL2Loss=0.2906 + throughput/total_tokens=156,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=817/500000] + train/ActionNoiseL2Loss=0.2288 + throughput/total_tokens=156,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=818/500000] + train/ActionNoiseL2Loss=0.1955 + throughput/total_tokens=157,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=819/500000] + train/ActionNoiseL2Loss=0.1177 + throughput/total_tokens=157,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=820/500000] + optim/total_grad_norm=5.987 + train/ActionNoiseL2Loss=0.2220 + throughput/total_tokens=157,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=821/500000] + train/ActionNoiseL2Loss=0.2725 + throughput/total_tokens=157,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=822/500000] + train/ActionNoiseL2Loss=0.1455 + throughput/total_tokens=157,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=823/500000] + train/ActionNoiseL2Loss=0.2124 + throughput/total_tokens=158,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=824/500000] + train/ActionNoiseL2Loss=0.1729 + throughput/total_tokens=158,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=825/500000] + train/ActionNoiseL2Loss=0.2087 + throughput/total_tokens=158,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=826/500000] + train/ActionNoiseL2Loss=0.2296 + throughput/total_tokens=158,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=827/500000] + train/ActionNoiseL2Loss=0.2411 + throughput/total_tokens=158,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=828/500000] + train/ActionNoiseL2Loss=0.1490 + throughput/total_tokens=158,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=829/500000] + train/ActionNoiseL2Loss=0.1650 + throughput/total_tokens=159,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=830/500000] + train/ActionNoiseL2Loss=0.1877 + throughput/total_tokens=159,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=831/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=159,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=832/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=159,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=833/500000] + train/ActionNoiseL2Loss=0.2675 + throughput/total_tokens=159,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=834/500000] + train/ActionNoiseL2Loss=0.2354 + throughput/total_tokens=160,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=835/500000] + train/ActionNoiseL2Loss=0.1469 + throughput/total_tokens=160,320,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=836/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=160,512,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=837/500000] + train/ActionNoiseL2Loss=0.1345 + throughput/total_tokens=160,704,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=838/500000] + train/ActionNoiseL2Loss=0.1453 + throughput/total_tokens=160,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=839/500000] + train/ActionNoiseL2Loss=0.1726 + throughput/total_tokens=161,088,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=840/500000] + optim/total_grad_norm=4.207 + train/ActionNoiseL2Loss=0.1240 + throughput/total_tokens=161,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=841/500000] + train/ActionNoiseL2Loss=0.2423 + throughput/total_tokens=161,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=842/500000] + train/ActionNoiseL2Loss=0.1437 + throughput/total_tokens=161,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=843/500000] + train/ActionNoiseL2Loss=0.1514 + throughput/total_tokens=161,856,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=844/500000] + train/ActionNoiseL2Loss=0.1762 + throughput/total_tokens=162,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=845/500000] + train/ActionNoiseL2Loss=0.1387 + throughput/total_tokens=162,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=846/500000] + train/ActionNoiseL2Loss=0.1502 + throughput/total_tokens=162,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=847/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=162,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=848/500000] + train/ActionNoiseL2Loss=0.1653 + throughput/total_tokens=162,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=849/500000] + train/ActionNoiseL2Loss=0.1716 + throughput/total_tokens=163,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=850/500000] + train/ActionNoiseL2Loss=0.1617 + throughput/total_tokens=163,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=851/500000] + train/ActionNoiseL2Loss=0.1206 + throughput/total_tokens=163,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=852/500000] + train/ActionNoiseL2Loss=0.1781 + throughput/total_tokens=163,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=853/500000] + train/ActionNoiseL2Loss=0.1509 + throughput/total_tokens=163,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=854/500000] + train/ActionNoiseL2Loss=0.2073 + throughput/total_tokens=163,968,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=855/500000] + train/ActionNoiseL2Loss=0.3320 + throughput/total_tokens=164,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=856/500000] + train/ActionNoiseL2Loss=0.1908 + throughput/total_tokens=164,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=857/500000] + train/ActionNoiseL2Loss=0.1423 + throughput/total_tokens=164,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=858/500000] + train/ActionNoiseL2Loss=0.1977 + throughput/total_tokens=164,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=859/500000] + train/ActionNoiseL2Loss=0.4090 + throughput/total_tokens=164,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=860/500000] + optim/total_grad_norm=7.457 + train/ActionNoiseL2Loss=0.1968 + throughput/total_tokens=165,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=861/500000] + train/ActionNoiseL2Loss=0.2877 + throughput/total_tokens=165,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=862/500000] + train/ActionNoiseL2Loss=0.1812 + throughput/total_tokens=165,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=863/500000] + train/ActionNoiseL2Loss=0.2658 + throughput/total_tokens=165,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=864/500000] + train/ActionNoiseL2Loss=0.2675 + throughput/total_tokens=165,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=865/500000] + train/ActionNoiseL2Loss=0.2430 + throughput/total_tokens=166,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=866/500000] + train/ActionNoiseL2Loss=0.3858 + throughput/total_tokens=166,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=867/500000] + train/ActionNoiseL2Loss=0.2185 + throughput/total_tokens=166,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=868/500000] + train/ActionNoiseL2Loss=0.1340 + throughput/total_tokens=166,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=869/500000] + train/ActionNoiseL2Loss=0.1298 + throughput/total_tokens=166,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=870/500000] + train/ActionNoiseL2Loss=0.2002 + throughput/total_tokens=167,040,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=871/500000] + train/ActionNoiseL2Loss=0.1421 + throughput/total_tokens=167,232,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=872/500000] + train/ActionNoiseL2Loss=0.2525 + throughput/total_tokens=167,424,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=873/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=167,616,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=874/500000] + train/ActionNoiseL2Loss=0.1471 + throughput/total_tokens=167,808,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=875/500000] + train/ActionNoiseL2Loss=0.1409 + throughput/total_tokens=168,000,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=876/500000] + train/ActionNoiseL2Loss=0.1543 + throughput/total_tokens=168,192,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=877/500000] + train/ActionNoiseL2Loss=0.1974 + throughput/total_tokens=168,384,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=878/500000] + train/ActionNoiseL2Loss=0.2057 + throughput/total_tokens=168,576,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=879/500000] + train/ActionNoiseL2Loss=0.1897 + throughput/total_tokens=168,768,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=880/500000] + optim/total_grad_norm=4.874 + train/ActionNoiseL2Loss=0.1360 + throughput/total_tokens=168,960,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=881/500000] + train/ActionNoiseL2Loss=0.1453 + throughput/total_tokens=169,152,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=882/500000] + train/ActionNoiseL2Loss=0.2261 + throughput/total_tokens=169,344,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=883/500000] + train/ActionNoiseL2Loss=0.1268 + throughput/total_tokens=169,536,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=884/500000] + train/ActionNoiseL2Loss=0.1343 + throughput/total_tokens=169,728,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=885/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=169,920,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=886/500000] + train/ActionNoiseL2Loss=0.1419 + throughput/total_tokens=170,112,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=887/500000] + train/ActionNoiseL2Loss=0.1421 + throughput/total_tokens=170,304,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=888/500000] + train/ActionNoiseL2Loss=0.2245 + throughput/total_tokens=170,496,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=889/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=170,688,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=890/500000] + train/ActionNoiseL2Loss=0.1486 + throughput/total_tokens=170,880,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=891/500000] + train/ActionNoiseL2Loss=0.1564 + throughput/total_tokens=171,072,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=892/500000] + train/ActionNoiseL2Loss=0.1540 + throughput/total_tokens=171,264,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=893/500000] + train/ActionNoiseL2Loss=0.1140 + throughput/total_tokens=171,456,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=894/500000] + train/ActionNoiseL2Loss=0.1268 + throughput/total_tokens=171,648,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=895/500000] + train/ActionNoiseL2Loss=0.1692 + throughput/total_tokens=171,840,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=896/500000] + train/ActionNoiseL2Loss=0.1288 + throughput/total_tokens=172,032,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=897/500000] + train/ActionNoiseL2Loss=0.1800 + throughput/total_tokens=172,224,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=898/500000] + train/ActionNoiseL2Loss=0.1615 + throughput/total_tokens=172,416,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=899/500000] + train/ActionNoiseL2Loss=0.1371 + throughput/total_tokens=172,608,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=900/500000] + optim/total_grad_norm=3.508 + train/ActionNoiseL2Loss=0.1152 + throughput/total_tokens=172,800,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=901/500000] + train/ActionNoiseL2Loss=0.1548 + throughput/total_tokens=172,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=902/500000] + train/ActionNoiseL2Loss=0.1856 + throughput/total_tokens=173,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=903/500000] + train/ActionNoiseL2Loss=0.1886 + throughput/total_tokens=173,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=904/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=173,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=905/500000] + train/ActionNoiseL2Loss=0.1527 + throughput/total_tokens=173,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=906/500000] + train/ActionNoiseL2Loss=0.1990 + throughput/total_tokens=173,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=907/500000] + train/ActionNoiseL2Loss=0.1827 + throughput/total_tokens=174,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=908/500000] + train/ActionNoiseL2Loss=0.1650 + throughput/total_tokens=174,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=909/500000] + train/ActionNoiseL2Loss=0.1901 + throughput/total_tokens=174,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=910/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=174,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=911/500000] + train/ActionNoiseL2Loss=0.1589 + throughput/total_tokens=174,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=912/500000] + train/ActionNoiseL2Loss=0.1486 + throughput/total_tokens=175,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=913/500000] + train/ActionNoiseL2Loss=0.1711 + throughput/total_tokens=175,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=914/500000] + train/ActionNoiseL2Loss=0.2283 + throughput/total_tokens=175,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=915/500000] + train/ActionNoiseL2Loss=0.1971 + throughput/total_tokens=175,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=916/500000] + train/ActionNoiseL2Loss=0.1053 + throughput/total_tokens=175,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=917/500000] + train/ActionNoiseL2Loss=0.1918 + throughput/total_tokens=176,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=918/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=176,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=919/500000] + train/ActionNoiseL2Loss=0.1841 + throughput/total_tokens=176,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=920/500000] + optim/total_grad_norm=7.307 + train/ActionNoiseL2Loss=0.2208 + throughput/total_tokens=176,640,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=921/500000] + train/ActionNoiseL2Loss=0.1809 + throughput/total_tokens=176,832,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=922/500000] + train/ActionNoiseL2Loss=0.1312 + throughput/total_tokens=177,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=923/500000] + train/ActionNoiseL2Loss=0.1768 + throughput/total_tokens=177,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=924/500000] + train/ActionNoiseL2Loss=0.1269 + throughput/total_tokens=177,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=925/500000] + train/ActionNoiseL2Loss=0.2177 + throughput/total_tokens=177,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=926/500000] + train/ActionNoiseL2Loss=0.1832 + throughput/total_tokens=177,792,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=927/500000] + train/ActionNoiseL2Loss=0.1696 + throughput/total_tokens=177,984,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=928/500000] + train/ActionNoiseL2Loss=0.1421 + throughput/total_tokens=178,176,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=929/500000] + train/ActionNoiseL2Loss=0.2197 + throughput/total_tokens=178,368,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=930/500000] + train/ActionNoiseL2Loss=0.2285 + throughput/total_tokens=178,560,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=931/500000] + train/ActionNoiseL2Loss=0.2792 + throughput/total_tokens=178,752,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=932/500000] + train/ActionNoiseL2Loss=0.1670 + throughput/total_tokens=178,944,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=933/500000] + train/ActionNoiseL2Loss=0.2479 + throughput/total_tokens=179,136,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=934/500000] + train/ActionNoiseL2Loss=0.1820 + throughput/total_tokens=179,328,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=935/500000] + train/ActionNoiseL2Loss=0.1644 + throughput/total_tokens=179,520,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=936/500000] + train/ActionNoiseL2Loss=0.1693 + throughput/total_tokens=179,712,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=937/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=179,904,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=938/500000] + train/ActionNoiseL2Loss=0.1510 + throughput/total_tokens=180,096,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=939/500000] + train/ActionNoiseL2Loss=0.1736 + throughput/total_tokens=180,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=940/500000] + optim/total_grad_norm=6.781 + train/ActionNoiseL2Loss=0.2180 + throughput/total_tokens=180,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=941/500000] + train/ActionNoiseL2Loss=0.1682 + throughput/total_tokens=180,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=942/500000] + train/ActionNoiseL2Loss=0.3380 + throughput/total_tokens=180,864,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=943/500000] + train/ActionNoiseL2Loss=0.2170 + throughput/total_tokens=181,056,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=944/500000] + train/ActionNoiseL2Loss=0.1963 + throughput/total_tokens=181,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=945/500000] + train/ActionNoiseL2Loss=0.1181 + throughput/total_tokens=181,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=946/500000] + train/ActionNoiseL2Loss=0.1716 + throughput/total_tokens=181,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=947/500000] + train/ActionNoiseL2Loss=0.1296 + throughput/total_tokens=181,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=948/500000] + train/ActionNoiseL2Loss=0.2257 + throughput/total_tokens=182,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=949/500000] + train/ActionNoiseL2Loss=0.1774 + throughput/total_tokens=182,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=950/500000] + train/ActionNoiseL2Loss=0.2323 + throughput/total_tokens=182,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=951/500000] + train/ActionNoiseL2Loss=0.1878 + throughput/total_tokens=182,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=952/500000] + train/ActionNoiseL2Loss=0.1214 + throughput/total_tokens=182,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=953/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=182,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=954/500000] + train/ActionNoiseL2Loss=0.1751 + throughput/total_tokens=183,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=955/500000] + train/ActionNoiseL2Loss=0.1530 + throughput/total_tokens=183,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=956/500000] + train/ActionNoiseL2Loss=0.2305 + throughput/total_tokens=183,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=957/500000] + train/ActionNoiseL2Loss=0.2184 + throughput/total_tokens=183,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=958/500000] + train/ActionNoiseL2Loss=0.2270 + throughput/total_tokens=183,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=959/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=184,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=960/500000] + optim/total_grad_norm=5.705 + train/ActionNoiseL2Loss=0.1425 + throughput/total_tokens=184,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=961/500000] + train/ActionNoiseL2Loss=0.1787 + throughput/total_tokens=184,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=962/500000] + train/ActionNoiseL2Loss=0.1251 + throughput/total_tokens=184,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=963/500000] + train/ActionNoiseL2Loss=0.1122 + throughput/total_tokens=184,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=964/500000] + train/ActionNoiseL2Loss=0.1813 + throughput/total_tokens=185,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=965/500000] + train/ActionNoiseL2Loss=0.1918 + throughput/total_tokens=185,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=966/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=185,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=967/500000] + train/ActionNoiseL2Loss=0.2001 + throughput/total_tokens=185,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=968/500000] + train/ActionNoiseL2Loss=0.1845 + throughput/total_tokens=185,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=969/500000] + train/ActionNoiseL2Loss=0.1627 + throughput/total_tokens=186,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=970/500000] + train/ActionNoiseL2Loss=0.2253 + throughput/total_tokens=186,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=971/500000] + train/ActionNoiseL2Loss=0.1745 + throughput/total_tokens=186,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=972/500000] + train/ActionNoiseL2Loss=0.1820 + throughput/total_tokens=186,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=973/500000] + train/ActionNoiseL2Loss=0.1542 + throughput/total_tokens=186,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=974/500000] + train/ActionNoiseL2Loss=0.2019 + throughput/total_tokens=187,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=975/500000] + train/ActionNoiseL2Loss=0.2255 + throughput/total_tokens=187,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=976/500000] + train/ActionNoiseL2Loss=0.1938 + throughput/total_tokens=187,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=977/500000] + train/ActionNoiseL2Loss=0.1761 + throughput/total_tokens=187,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=978/500000] + train/ActionNoiseL2Loss=0.2520 + throughput/total_tokens=187,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=979/500000] + train/ActionNoiseL2Loss=0.1525 + throughput/total_tokens=187,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=980/500000] + optim/total_grad_norm=4.831 + train/ActionNoiseL2Loss=0.1693 + throughput/total_tokens=188,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=981/500000] + train/ActionNoiseL2Loss=0.2220 + throughput/total_tokens=188,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=982/500000] + train/ActionNoiseL2Loss=0.2075 + throughput/total_tokens=188,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=983/500000] + train/ActionNoiseL2Loss=0.1840 + throughput/total_tokens=188,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=984/500000] + train/ActionNoiseL2Loss=0.1600 + throughput/total_tokens=188,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=985/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=189,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=986/500000] + train/ActionNoiseL2Loss=0.1629 + throughput/total_tokens=189,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=987/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=189,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=988/500000] + train/ActionNoiseL2Loss=0.1969 + throughput/total_tokens=189,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=989/500000] + train/ActionNoiseL2Loss=0.2359 + throughput/total_tokens=189,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=990/500000] + train/ActionNoiseL2Loss=0.1522 + throughput/total_tokens=190,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=991/500000] + train/ActionNoiseL2Loss=0.1698 + throughput/total_tokens=190,272,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=992/500000] + train/ActionNoiseL2Loss=0.1503 + throughput/total_tokens=190,464,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=993/500000] + train/ActionNoiseL2Loss=0.1959 + throughput/total_tokens=190,656,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=994/500000] + train/ActionNoiseL2Loss=0.1948 + throughput/total_tokens=190,848,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=995/500000] + train/ActionNoiseL2Loss=0.1541 + throughput/total_tokens=191,040,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=996/500000] + train/ActionNoiseL2Loss=0.2892 + throughput/total_tokens=191,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=997/500000] + train/ActionNoiseL2Loss=0.1119 + throughput/total_tokens=191,424,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=998/500000] + train/ActionNoiseL2Loss=0.1691 + throughput/total_tokens=191,616,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=999/500000] + train/ActionNoiseL2Loss=0.1289 + throughput/total_tokens=191,808,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1000/500000] + optim/total_grad_norm=8.341 + train/ActionNoiseL2Loss=0.2613 + throughput/total_tokens=192,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +10/05 [22:34:02] INFO | >> Saving config... checkpoint.py:608 +10/05 [22:34:40] INFO | >> Saving model state... checkpoint.py:796 +10/05 [22:35:52] INFO | >> Saving optim state... checkpoint.py:811 +10/05 [22:37:23] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=1001/500000] + train/ActionNoiseL2Loss=0.2724 + throughput/total_tokens=192,192,000 + throughput/device/tokens_per_second=1,192 + throughput/device/batches_per_second=0.0497 +[step=1002/500000] + train/ActionNoiseL2Loss=0.1603 + throughput/total_tokens=192,384,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=1003/500000] + train/ActionNoiseL2Loss=0.1458 + throughput/total_tokens=192,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=1004/500000] + train/ActionNoiseL2Loss=0.1511 + throughput/total_tokens=192,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=1005/500000] + train/ActionNoiseL2Loss=0.1308 + throughput/total_tokens=192,960,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=1006/500000] + train/ActionNoiseL2Loss=0.1529 + throughput/total_tokens=193,152,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=1007/500000] + train/ActionNoiseL2Loss=0.1212 + throughput/total_tokens=193,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1008/500000] + train/ActionNoiseL2Loss=0.1743 + throughput/total_tokens=193,536,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1009/500000] + train/ActionNoiseL2Loss=0.1795 + throughput/total_tokens=193,728,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1010/500000] + train/ActionNoiseL2Loss=0.1357 + throughput/total_tokens=193,920,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1011/500000] + train/ActionNoiseL2Loss=0.1700 + throughput/total_tokens=194,112,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1012/500000] + train/ActionNoiseL2Loss=0.2107 + throughput/total_tokens=194,304,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1013/500000] + train/ActionNoiseL2Loss=0.1550 + throughput/total_tokens=194,496,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1014/500000] + train/ActionNoiseL2Loss=0.1500 + throughput/total_tokens=194,688,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1015/500000] + train/ActionNoiseL2Loss=0.1671 + throughput/total_tokens=194,880,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1016/500000] + train/ActionNoiseL2Loss=0.1563 + throughput/total_tokens=195,072,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1017/500000] + train/ActionNoiseL2Loss=0.1920 + throughput/total_tokens=195,264,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1018/500000] + train/ActionNoiseL2Loss=0.1514 + throughput/total_tokens=195,456,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1019/500000] + train/ActionNoiseL2Loss=0.1618 + throughput/total_tokens=195,648,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1020/500000] + optim/total_grad_norm=4.634 + train/ActionNoiseL2Loss=0.1418 + throughput/total_tokens=195,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1021/500000] + train/ActionNoiseL2Loss=0.1490 + throughput/total_tokens=196,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1022/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=196,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1023/500000] + train/ActionNoiseL2Loss=0.1278 + throughput/total_tokens=196,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1024/500000] + train/ActionNoiseL2Loss=0.1483 + throughput/total_tokens=196,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1025/500000] + train/ActionNoiseL2Loss=0.1450 + throughput/total_tokens=196,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1026/500000] + train/ActionNoiseL2Loss=0.1037 + throughput/total_tokens=196,992,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1027/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=197,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1028/500000] + train/ActionNoiseL2Loss=0.1747 + throughput/total_tokens=197,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1029/500000] + train/ActionNoiseL2Loss=0.1194 + throughput/total_tokens=197,568,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1030/500000] + train/ActionNoiseL2Loss=0.1276 + throughput/total_tokens=197,760,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1031/500000] + train/ActionNoiseL2Loss=0.1370 + throughput/total_tokens=197,952,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1032/500000] + train/ActionNoiseL2Loss=0.1512 + throughput/total_tokens=198,144,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1033/500000] + train/ActionNoiseL2Loss=0.1564 + throughput/total_tokens=198,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1034/500000] + train/ActionNoiseL2Loss=0.1322 + throughput/total_tokens=198,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1035/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=198,720,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1036/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=198,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1037/500000] + train/ActionNoiseL2Loss=0.2363 + throughput/total_tokens=199,104,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1038/500000] + train/ActionNoiseL2Loss=0.1646 + throughput/total_tokens=199,296,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1039/500000] + train/ActionNoiseL2Loss=0.1281 + throughput/total_tokens=199,488,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1040/500000] + optim/total_grad_norm=8.575 + train/ActionNoiseL2Loss=0.2387 + throughput/total_tokens=199,680,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1041/500000] + train/ActionNoiseL2Loss=0.2021 + throughput/total_tokens=199,872,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1042/500000] + train/ActionNoiseL2Loss=0.1724 + throughput/total_tokens=200,064,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1043/500000] + train/ActionNoiseL2Loss=0.1636 + throughput/total_tokens=200,256,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1044/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=200,448,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1045/500000] + train/ActionNoiseL2Loss=0.1094 + throughput/total_tokens=200,640,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1046/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=200,832,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1047/500000] + train/ActionNoiseL2Loss=0.2229 + throughput/total_tokens=201,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1048/500000] + train/ActionNoiseL2Loss=0.1663 + throughput/total_tokens=201,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1049/500000] + train/ActionNoiseL2Loss=0.1448 + throughput/total_tokens=201,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1050/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=201,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1051/500000] + train/ActionNoiseL2Loss=0.1222 + throughput/total_tokens=201,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1052/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=201,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1053/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=202,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1054/500000] + train/ActionNoiseL2Loss=0.1508 + throughput/total_tokens=202,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1055/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=202,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1056/500000] + train/ActionNoiseL2Loss=0.1979 + throughput/total_tokens=202,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1057/500000] + train/ActionNoiseL2Loss=0.2111 + throughput/total_tokens=202,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1058/500000] + train/ActionNoiseL2Loss=0.1449 + throughput/total_tokens=203,136,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1059/500000] + train/ActionNoiseL2Loss=0.2205 + throughput/total_tokens=203,328,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1060/500000] + optim/total_grad_norm=6.198 + train/ActionNoiseL2Loss=0.2225 + throughput/total_tokens=203,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1061/500000] + train/ActionNoiseL2Loss=0.1780 + throughput/total_tokens=203,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1062/500000] + train/ActionNoiseL2Loss=0.2450 + throughput/total_tokens=203,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1063/500000] + train/ActionNoiseL2Loss=0.1281 + throughput/total_tokens=204,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1064/500000] + train/ActionNoiseL2Loss=0.1226 + throughput/total_tokens=204,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1065/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=204,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1066/500000] + train/ActionNoiseL2Loss=0.1285 + throughput/total_tokens=204,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1067/500000] + train/ActionNoiseL2Loss=0.2627 + throughput/total_tokens=204,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1068/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=205,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1069/500000] + train/ActionNoiseL2Loss=0.2403 + throughput/total_tokens=205,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1070/500000] + train/ActionNoiseL2Loss=0.1176 + throughput/total_tokens=205,440,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1071/500000] + train/ActionNoiseL2Loss=0.1927 + throughput/total_tokens=205,632,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1072/500000] + train/ActionNoiseL2Loss=0.1573 + throughput/total_tokens=205,824,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1073/500000] + train/ActionNoiseL2Loss=0.1247 + throughput/total_tokens=206,016,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1074/500000] + train/ActionNoiseL2Loss=0.1802 + throughput/total_tokens=206,208,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1075/500000] + train/ActionNoiseL2Loss=0.1799 + throughput/total_tokens=206,400,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1076/500000] + train/ActionNoiseL2Loss=0.1870 + throughput/total_tokens=206,592,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1077/500000] + train/ActionNoiseL2Loss=0.1094 + throughput/total_tokens=206,784,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1078/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=206,976,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1079/500000] + train/ActionNoiseL2Loss=0.1502 + throughput/total_tokens=207,168,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1080/500000] + optim/total_grad_norm=5.358 + train/ActionNoiseL2Loss=0.1623 + throughput/total_tokens=207,360,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1081/500000] + train/ActionNoiseL2Loss=0.1408 + throughput/total_tokens=207,552,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1082/500000] + train/ActionNoiseL2Loss=0.2180 + throughput/total_tokens=207,744,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1083/500000] + train/ActionNoiseL2Loss=0.1478 + throughput/total_tokens=207,936,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1084/500000] + train/ActionNoiseL2Loss=0.2298 + throughput/total_tokens=208,128,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1085/500000] + train/ActionNoiseL2Loss=0.1491 + throughput/total_tokens=208,320,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1086/500000] + train/ActionNoiseL2Loss=0.1858 + throughput/total_tokens=208,512,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1087/500000] + train/ActionNoiseL2Loss=0.1264 + throughput/total_tokens=208,704,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1088/500000] + train/ActionNoiseL2Loss=0.1276 + throughput/total_tokens=208,896,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1089/500000] + train/ActionNoiseL2Loss=0.1670 + throughput/total_tokens=209,088,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1090/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=209,280,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1091/500000] + train/ActionNoiseL2Loss=0.1475 + throughput/total_tokens=209,472,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1092/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=209,664,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1093/500000] + train/ActionNoiseL2Loss=0.1998 + throughput/total_tokens=209,856,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1094/500000] + train/ActionNoiseL2Loss=0.1803 + throughput/total_tokens=210,048,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1095/500000] + train/ActionNoiseL2Loss=0.1644 + throughput/total_tokens=210,240,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1096/500000] + train/ActionNoiseL2Loss=0.1201 + throughput/total_tokens=210,432,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1097/500000] + train/ActionNoiseL2Loss=0.1459 + throughput/total_tokens=210,624,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1098/500000] + train/ActionNoiseL2Loss=0.1141 + throughput/total_tokens=210,816,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1099/500000] + train/ActionNoiseL2Loss=0.1904 + throughput/total_tokens=211,008,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1100/500000] + optim/total_grad_norm=3.674 + train/ActionNoiseL2Loss=0.1137 + throughput/total_tokens=211,200,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1101/500000] + train/ActionNoiseL2Loss=0.2133 + throughput/total_tokens=211,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1102/500000] + train/ActionNoiseL2Loss=0.1179 + throughput/total_tokens=211,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1103/500000] + train/ActionNoiseL2Loss=0.2077 + throughput/total_tokens=211,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1104/500000] + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=211,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1105/500000] + train/ActionNoiseL2Loss=0.1543 + throughput/total_tokens=212,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1106/500000] + train/ActionNoiseL2Loss=0.2834 + throughput/total_tokens=212,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1107/500000] + train/ActionNoiseL2Loss=0.1658 + throughput/total_tokens=212,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1108/500000] + train/ActionNoiseL2Loss=0.1192 + throughput/total_tokens=212,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1109/500000] + train/ActionNoiseL2Loss=0.1263 + throughput/total_tokens=212,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1110/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=213,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1111/500000] + train/ActionNoiseL2Loss=0.1285 + throughput/total_tokens=213,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1112/500000] + train/ActionNoiseL2Loss=0.1087 + throughput/total_tokens=213,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1113/500000] + train/ActionNoiseL2Loss=0.1582 + throughput/total_tokens=213,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1114/500000] + train/ActionNoiseL2Loss=0.1554 + throughput/total_tokens=213,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1115/500000] + train/ActionNoiseL2Loss=0.1823 + throughput/total_tokens=214,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1116/500000] + train/ActionNoiseL2Loss=0.2550 + throughput/total_tokens=214,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1117/500000] + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=214,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1118/500000] + train/ActionNoiseL2Loss=0.1860 + throughput/total_tokens=214,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1119/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=214,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1120/500000] + optim/total_grad_norm=3.678 + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=215,040,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1121/500000] + train/ActionNoiseL2Loss=0.1433 + throughput/total_tokens=215,232,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1122/500000] + train/ActionNoiseL2Loss=0.1532 + throughput/total_tokens=215,424,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1123/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=215,616,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1124/500000] + train/ActionNoiseL2Loss=0.1728 + throughput/total_tokens=215,808,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1125/500000] + train/ActionNoiseL2Loss=0.1072 + throughput/total_tokens=216,000,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1126/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=216,192,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1127/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=216,384,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1128/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=216,576,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1129/500000] + train/ActionNoiseL2Loss=0.1576 + throughput/total_tokens=216,768,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1130/500000] + train/ActionNoiseL2Loss=0.1475 + throughput/total_tokens=216,960,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1131/500000] + train/ActionNoiseL2Loss=0.1873 + throughput/total_tokens=217,152,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1132/500000] + train/ActionNoiseL2Loss=0.1085 + throughput/total_tokens=217,344,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1133/500000] + train/ActionNoiseL2Loss=0.1342 + throughput/total_tokens=217,536,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1134/500000] + train/ActionNoiseL2Loss=0.1650 + throughput/total_tokens=217,728,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1135/500000] + train/ActionNoiseL2Loss=0.1537 + throughput/total_tokens=217,920,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1136/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=218,112,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1137/500000] + train/ActionNoiseL2Loss=0.1267 + throughput/total_tokens=218,304,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1138/500000] + train/ActionNoiseL2Loss=0.1258 + throughput/total_tokens=218,496,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1139/500000] + train/ActionNoiseL2Loss=0.1199 + throughput/total_tokens=218,688,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1140/500000] + optim/total_grad_norm=8.607 + train/ActionNoiseL2Loss=0.2503 + throughput/total_tokens=218,880,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1141/500000] + train/ActionNoiseL2Loss=0.3595 + throughput/total_tokens=219,072,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1142/500000] + train/ActionNoiseL2Loss=0.1599 + throughput/total_tokens=219,264,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1143/500000] + train/ActionNoiseL2Loss=0.1873 + throughput/total_tokens=219,456,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1144/500000] + train/ActionNoiseL2Loss=0.1627 + throughput/total_tokens=219,648,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1145/500000] + train/ActionNoiseL2Loss=0.2538 + throughput/total_tokens=219,840,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1146/500000] + train/ActionNoiseL2Loss=0.2434 + throughput/total_tokens=220,032,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1147/500000] + train/ActionNoiseL2Loss=0.2710 + throughput/total_tokens=220,224,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1148/500000] + train/ActionNoiseL2Loss=0.1795 + throughput/total_tokens=220,416,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1149/500000] + train/ActionNoiseL2Loss=0.2804 + throughput/total_tokens=220,608,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1150/500000] + train/ActionNoiseL2Loss=0.1387 + throughput/total_tokens=220,800,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1151/500000] + train/ActionNoiseL2Loss=0.1424 + throughput/total_tokens=220,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1152/500000] + train/ActionNoiseL2Loss=0.1204 + throughput/total_tokens=221,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1153/500000] + train/ActionNoiseL2Loss=0.1889 + throughput/total_tokens=221,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1154/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=221,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1155/500000] + train/ActionNoiseL2Loss=0.1972 + throughput/total_tokens=221,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1156/500000] + train/ActionNoiseL2Loss=0.3051 + throughput/total_tokens=221,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1157/500000] + train/ActionNoiseL2Loss=0.2447 + throughput/total_tokens=222,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1158/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=222,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1159/500000] + train/ActionNoiseL2Loss=0.1436 + throughput/total_tokens=222,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1160/500000] + optim/total_grad_norm=3.518 + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=222,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1161/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=222,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1162/500000] + train/ActionNoiseL2Loss=0.2203 + throughput/total_tokens=223,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1163/500000] + train/ActionNoiseL2Loss=0.1277 + throughput/total_tokens=223,296,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1164/500000] + train/ActionNoiseL2Loss=0.1495 + throughput/total_tokens=223,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1165/500000] + train/ActionNoiseL2Loss=0.1587 + throughput/total_tokens=223,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1166/500000] + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=223,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1167/500000] + train/ActionNoiseL2Loss=0.2584 + throughput/total_tokens=224,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1168/500000] + train/ActionNoiseL2Loss=0.1024 + throughput/total_tokens=224,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1169/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=224,448,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1170/500000] + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=224,640,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1171/500000] + train/ActionNoiseL2Loss=0.3807 + throughput/total_tokens=224,832,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1172/500000] + train/ActionNoiseL2Loss=0.1798 + throughput/total_tokens=225,024,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1173/500000] + train/ActionNoiseL2Loss=0.1496 + throughput/total_tokens=225,216,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1174/500000] + train/ActionNoiseL2Loss=0.2634 + throughput/total_tokens=225,408,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1175/500000] + train/ActionNoiseL2Loss=0.1616 + throughput/total_tokens=225,600,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1176/500000] + train/ActionNoiseL2Loss=0.1568 + throughput/total_tokens=225,792,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1177/500000] + train/ActionNoiseL2Loss=0.1488 + throughput/total_tokens=225,984,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1178/500000] + train/ActionNoiseL2Loss=0.1928 + throughput/total_tokens=226,176,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1179/500000] + train/ActionNoiseL2Loss=0.1651 + throughput/total_tokens=226,368,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1180/500000] + optim/total_grad_norm=4.389 + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=226,560,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1181/500000] + train/ActionNoiseL2Loss=0.1441 + throughput/total_tokens=226,752,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1182/500000] + train/ActionNoiseL2Loss=0.1420 + throughput/total_tokens=226,944,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1183/500000] + train/ActionNoiseL2Loss=0.1521 + throughput/total_tokens=227,136,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1184/500000] + train/ActionNoiseL2Loss=0.1719 + throughput/total_tokens=227,328,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1185/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=227,520,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1186/500000] + train/ActionNoiseL2Loss=0.2668 + throughput/total_tokens=227,712,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1187/500000] + train/ActionNoiseL2Loss=0.1940 + throughput/total_tokens=227,904,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1188/500000] + train/ActionNoiseL2Loss=0.2347 + throughput/total_tokens=228,096,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1189/500000] + train/ActionNoiseL2Loss=0.1930 + throughput/total_tokens=228,288,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1190/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=228,480,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1191/500000] + train/ActionNoiseL2Loss=0.2170 + throughput/total_tokens=228,672,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1192/500000] + train/ActionNoiseL2Loss=0.1072 + throughput/total_tokens=228,864,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1193/500000] + train/ActionNoiseL2Loss=0.1205 + throughput/total_tokens=229,056,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1194/500000] + train/ActionNoiseL2Loss=0.1564 + throughput/total_tokens=229,248,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1195/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=229,440,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1196/500000] + train/ActionNoiseL2Loss=0.1686 + throughput/total_tokens=229,632,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1197/500000] + train/ActionNoiseL2Loss=0.1393 + throughput/total_tokens=229,824,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1198/500000] + train/ActionNoiseL2Loss=0.1481 + throughput/total_tokens=230,016,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1199/500000] + train/ActionNoiseL2Loss=0.1435 + throughput/total_tokens=230,208,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1200/500000] + optim/total_grad_norm=4.427 + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=230,400,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1201/500000] + train/ActionNoiseL2Loss=0.1352 + throughput/total_tokens=230,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1202/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=230,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1203/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=230,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1204/500000] + train/ActionNoiseL2Loss=0.1430 + throughput/total_tokens=231,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1205/500000] + train/ActionNoiseL2Loss=0.1100 + throughput/total_tokens=231,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1206/500000] + train/ActionNoiseL2Loss=0.1931 + throughput/total_tokens=231,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1207/500000] + train/ActionNoiseL2Loss=0.1443 + throughput/total_tokens=231,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1208/500000] + train/ActionNoiseL2Loss=0.1500 + throughput/total_tokens=231,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1209/500000] + train/ActionNoiseL2Loss=0.1504 + throughput/total_tokens=232,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1210/500000] + train/ActionNoiseL2Loss=0.1099 + throughput/total_tokens=232,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1211/500000] + train/ActionNoiseL2Loss=0.2442 + throughput/total_tokens=232,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1212/500000] + train/ActionNoiseL2Loss=0.1275 + throughput/total_tokens=232,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1213/500000] + train/ActionNoiseL2Loss=0.2062 + throughput/total_tokens=232,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1214/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=233,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1215/500000] + train/ActionNoiseL2Loss=0.1488 + throughput/total_tokens=233,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1216/500000] + train/ActionNoiseL2Loss=0.1904 + throughput/total_tokens=233,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1217/500000] + train/ActionNoiseL2Loss=0.1182 + throughput/total_tokens=233,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1218/500000] + train/ActionNoiseL2Loss=0.2139 + throughput/total_tokens=233,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1219/500000] + train/ActionNoiseL2Loss=0.1319 + throughput/total_tokens=234,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1220/500000] + optim/total_grad_norm=3.039 + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=234,240,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1221/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=234,432,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1222/500000] + train/ActionNoiseL2Loss=0.2443 + throughput/total_tokens=234,624,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1223/500000] + train/ActionNoiseL2Loss=0.1550 + throughput/total_tokens=234,816,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1224/500000] + train/ActionNoiseL2Loss=0.1381 + throughput/total_tokens=235,008,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1225/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=235,200,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1226/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=235,392,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1227/500000] + train/ActionNoiseL2Loss=0.1930 + throughput/total_tokens=235,584,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1228/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=235,776,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1229/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=235,968,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1230/500000] + train/ActionNoiseL2Loss=0.1365 + throughput/total_tokens=236,160,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1231/500000] + train/ActionNoiseL2Loss=0.1758 + throughput/total_tokens=236,352,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1232/500000] + train/ActionNoiseL2Loss=0.2228 + throughput/total_tokens=236,544,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1233/500000] + train/ActionNoiseL2Loss=0.1409 + throughput/total_tokens=236,736,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1234/500000] + train/ActionNoiseL2Loss=0.3125 + throughput/total_tokens=236,928,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1235/500000] + train/ActionNoiseL2Loss=0.2087 + throughput/total_tokens=237,120,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1236/500000] + train/ActionNoiseL2Loss=0.2156 + throughput/total_tokens=237,312,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1237/500000] + train/ActionNoiseL2Loss=0.0979 + throughput/total_tokens=237,504,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1238/500000] + train/ActionNoiseL2Loss=0.1992 + throughput/total_tokens=237,696,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1239/500000] + train/ActionNoiseL2Loss=0.1313 + throughput/total_tokens=237,888,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1240/500000] + optim/total_grad_norm=4.838 + train/ActionNoiseL2Loss=0.1441 + throughput/total_tokens=238,080,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1241/500000] + train/ActionNoiseL2Loss=0.1260 + throughput/total_tokens=238,272,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1242/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=238,464,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1243/500000] + train/ActionNoiseL2Loss=0.2489 + throughput/total_tokens=238,656,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1244/500000] + train/ActionNoiseL2Loss=0.2173 + throughput/total_tokens=238,848,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1245/500000] + train/ActionNoiseL2Loss=0.1720 + throughput/total_tokens=239,040,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1246/500000] + train/ActionNoiseL2Loss=0.1926 + throughput/total_tokens=239,232,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1247/500000] + train/ActionNoiseL2Loss=0.1558 + throughput/total_tokens=239,424,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1248/500000] + train/ActionNoiseL2Loss=0.1356 + throughput/total_tokens=239,616,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1249/500000] + train/ActionNoiseL2Loss=0.1538 + throughput/total_tokens=239,808,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1250/500000] + train/ActionNoiseL2Loss=0.1358 + throughput/total_tokens=240,000,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1251/500000] + train/ActionNoiseL2Loss=0.1716 + throughput/total_tokens=240,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1252/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=240,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1253/500000] + train/ActionNoiseL2Loss=0.1813 + throughput/total_tokens=240,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1254/500000] + train/ActionNoiseL2Loss=0.1310 + throughput/total_tokens=240,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1255/500000] + train/ActionNoiseL2Loss=0.1491 + throughput/total_tokens=240,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1256/500000] + train/ActionNoiseL2Loss=0.1777 + throughput/total_tokens=241,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1257/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=241,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1258/500000] + train/ActionNoiseL2Loss=0.1357 + throughput/total_tokens=241,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1259/500000] + train/ActionNoiseL2Loss=0.1435 + throughput/total_tokens=241,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1260/500000] + optim/total_grad_norm=4.680 + train/ActionNoiseL2Loss=0.1261 + throughput/total_tokens=241,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1261/500000] + train/ActionNoiseL2Loss=0.1528 + throughput/total_tokens=242,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1262/500000] + train/ActionNoiseL2Loss=0.2159 + throughput/total_tokens=242,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1263/500000] + train/ActionNoiseL2Loss=0.1482 + throughput/total_tokens=242,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1264/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=242,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1265/500000] + train/ActionNoiseL2Loss=0.1288 + throughput/total_tokens=242,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1266/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=243,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1267/500000] + train/ActionNoiseL2Loss=0.1055 + throughput/total_tokens=243,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1268/500000] + train/ActionNoiseL2Loss=0.1286 + throughput/total_tokens=243,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1269/500000] + train/ActionNoiseL2Loss=0.1482 + throughput/total_tokens=243,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1270/500000] + train/ActionNoiseL2Loss=0.1663 + throughput/total_tokens=243,840,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1271/500000] + train/ActionNoiseL2Loss=0.1146 + throughput/total_tokens=244,032,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1272/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=244,224,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1273/500000] + train/ActionNoiseL2Loss=0.1210 + throughput/total_tokens=244,416,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1274/500000] + train/ActionNoiseL2Loss=0.1406 + throughput/total_tokens=244,608,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1275/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=244,800,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1276/500000] + train/ActionNoiseL2Loss=0.1651 + throughput/total_tokens=244,992,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1277/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=245,184,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1278/500000] + train/ActionNoiseL2Loss=0.1068 + throughput/total_tokens=245,376,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1279/500000] + train/ActionNoiseL2Loss=0.1701 + throughput/total_tokens=245,568,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1280/500000] + optim/total_grad_norm=3.995 + train/ActionNoiseL2Loss=0.1196 + throughput/total_tokens=245,760,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1281/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=245,952,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1282/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=246,144,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1283/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=246,336,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1284/500000] + train/ActionNoiseL2Loss=0.1586 + throughput/total_tokens=246,528,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1285/500000] + train/ActionNoiseL2Loss=0.1308 + throughput/total_tokens=246,720,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1286/500000] + train/ActionNoiseL2Loss=0.1484 + throughput/total_tokens=246,912,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1287/500000] + train/ActionNoiseL2Loss=0.1181 + throughput/total_tokens=247,104,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1288/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=247,296,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1289/500000] + train/ActionNoiseL2Loss=0.1568 + throughput/total_tokens=247,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1290/500000] + train/ActionNoiseL2Loss=0.1837 + throughput/total_tokens=247,680,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1291/500000] + train/ActionNoiseL2Loss=0.2733 + throughput/total_tokens=247,872,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1292/500000] + train/ActionNoiseL2Loss=0.1537 + throughput/total_tokens=248,064,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1293/500000] + train/ActionNoiseL2Loss=0.3044 + throughput/total_tokens=248,256,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1294/500000] + train/ActionNoiseL2Loss=0.1437 + throughput/total_tokens=248,448,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1295/500000] + train/ActionNoiseL2Loss=0.1438 + throughput/total_tokens=248,640,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1296/500000] + train/ActionNoiseL2Loss=0.2396 + throughput/total_tokens=248,832,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1297/500000] + train/ActionNoiseL2Loss=0.1547 + throughput/total_tokens=249,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1298/500000] + train/ActionNoiseL2Loss=0.2449 + throughput/total_tokens=249,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1299/500000] + train/ActionNoiseL2Loss=0.1515 + throughput/total_tokens=249,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1300/500000] + optim/total_grad_norm=4.408 + train/ActionNoiseL2Loss=0.1253 + throughput/total_tokens=249,600,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1301/500000] + train/ActionNoiseL2Loss=0.1422 + throughput/total_tokens=249,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1302/500000] + train/ActionNoiseL2Loss=0.1289 + throughput/total_tokens=249,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1303/500000] + train/ActionNoiseL2Loss=0.1338 + throughput/total_tokens=250,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1304/500000] + train/ActionNoiseL2Loss=0.1526 + throughput/total_tokens=250,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1305/500000] + train/ActionNoiseL2Loss=0.1229 + throughput/total_tokens=250,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1306/500000] + train/ActionNoiseL2Loss=0.1391 + throughput/total_tokens=250,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1307/500000] + train/ActionNoiseL2Loss=0.1536 + throughput/total_tokens=250,944,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1308/500000] + train/ActionNoiseL2Loss=0.1289 + throughput/total_tokens=251,136,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1309/500000] + train/ActionNoiseL2Loss=0.1570 + throughput/total_tokens=251,328,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1310/500000] + train/ActionNoiseL2Loss=0.1485 + throughput/total_tokens=251,520,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1311/500000] + train/ActionNoiseL2Loss=0.1584 + throughput/total_tokens=251,712,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1312/500000] + train/ActionNoiseL2Loss=0.2006 + throughput/total_tokens=251,904,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1313/500000] + train/ActionNoiseL2Loss=0.1734 + throughput/total_tokens=252,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1314/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=252,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1315/500000] + train/ActionNoiseL2Loss=0.1813 + throughput/total_tokens=252,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1316/500000] + train/ActionNoiseL2Loss=0.1549 + throughput/total_tokens=252,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1317/500000] + train/ActionNoiseL2Loss=0.1583 + throughput/total_tokens=252,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1318/500000] + train/ActionNoiseL2Loss=0.1498 + throughput/total_tokens=253,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1319/500000] + train/ActionNoiseL2Loss=0.1623 + throughput/total_tokens=253,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1320/500000] + optim/total_grad_norm=5.627 + train/ActionNoiseL2Loss=0.1889 + throughput/total_tokens=253,440,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1321/500000] + train/ActionNoiseL2Loss=0.2255 + throughput/total_tokens=253,632,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1322/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=253,824,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1323/500000] + train/ActionNoiseL2Loss=0.1136 + throughput/total_tokens=254,016,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1324/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=254,208,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1325/500000] + train/ActionNoiseL2Loss=0.1928 + throughput/total_tokens=254,400,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1326/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=254,592,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1327/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=254,784,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1328/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=254,976,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1329/500000] + train/ActionNoiseL2Loss=0.1302 + throughput/total_tokens=255,168,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1330/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=255,360,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1331/500000] + train/ActionNoiseL2Loss=0.1725 + throughput/total_tokens=255,552,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1332/500000] + train/ActionNoiseL2Loss=0.1767 + throughput/total_tokens=255,744,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1333/500000] + train/ActionNoiseL2Loss=0.1397 + throughput/total_tokens=255,936,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1334/500000] + train/ActionNoiseL2Loss=0.1809 + throughput/total_tokens=256,128,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1335/500000] + train/ActionNoiseL2Loss=0.2044 + throughput/total_tokens=256,320,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1336/500000] + train/ActionNoiseL2Loss=0.1601 + throughput/total_tokens=256,512,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1337/500000] + train/ActionNoiseL2Loss=0.1160 + throughput/total_tokens=256,704,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1338/500000] + train/ActionNoiseL2Loss=0.1498 + throughput/total_tokens=256,896,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1339/500000] + train/ActionNoiseL2Loss=0.1291 + throughput/total_tokens=257,088,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1340/500000] + optim/total_grad_norm=4.772 + train/ActionNoiseL2Loss=0.1175 + throughput/total_tokens=257,280,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1341/500000] + train/ActionNoiseL2Loss=0.1585 + throughput/total_tokens=257,472,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1342/500000] + train/ActionNoiseL2Loss=0.1245 + throughput/total_tokens=257,664,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1343/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=257,856,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1344/500000] + train/ActionNoiseL2Loss=0.1845 + throughput/total_tokens=258,048,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1345/500000] + train/ActionNoiseL2Loss=0.1305 + throughput/total_tokens=258,240,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1346/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=258,432,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1347/500000] + train/ActionNoiseL2Loss=0.1087 + throughput/total_tokens=258,624,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1348/500000] + train/ActionNoiseL2Loss=0.2979 + throughput/total_tokens=258,816,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1349/500000] + train/ActionNoiseL2Loss=0.1713 + throughput/total_tokens=259,008,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1350/500000] + train/ActionNoiseL2Loss=0.1623 + throughput/total_tokens=259,200,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1351/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=259,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1352/500000] + train/ActionNoiseL2Loss=0.1253 + throughput/total_tokens=259,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1353/500000] + train/ActionNoiseL2Loss=0.1718 + throughput/total_tokens=259,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1354/500000] + train/ActionNoiseL2Loss=0.2205 + throughput/total_tokens=259,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1355/500000] + train/ActionNoiseL2Loss=0.1339 + throughput/total_tokens=260,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1356/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=260,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1357/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=260,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1358/500000] + train/ActionNoiseL2Loss=0.1931 + throughput/total_tokens=260,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1359/500000] + train/ActionNoiseL2Loss=0.1480 + throughput/total_tokens=260,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1360/500000] + optim/total_grad_norm=5.722 + train/ActionNoiseL2Loss=0.1342 + throughput/total_tokens=261,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1361/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=261,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1362/500000] + train/ActionNoiseL2Loss=0.1856 + throughput/total_tokens=261,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1363/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=261,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1364/500000] + train/ActionNoiseL2Loss=0.1508 + throughput/total_tokens=261,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1365/500000] + train/ActionNoiseL2Loss=0.1124 + throughput/total_tokens=262,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1366/500000] + train/ActionNoiseL2Loss=0.2207 + throughput/total_tokens=262,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1367/500000] + train/ActionNoiseL2Loss=0.1708 + throughput/total_tokens=262,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1368/500000] + train/ActionNoiseL2Loss=0.1289 + throughput/total_tokens=262,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1369/500000] + train/ActionNoiseL2Loss=0.1160 + throughput/total_tokens=262,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1370/500000] + train/ActionNoiseL2Loss=0.2940 + throughput/total_tokens=263,040,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1371/500000] + train/ActionNoiseL2Loss=0.1533 + throughput/total_tokens=263,232,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1372/500000] + train/ActionNoiseL2Loss=0.2754 + throughput/total_tokens=263,424,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1373/500000] + train/ActionNoiseL2Loss=0.1562 + throughput/total_tokens=263,616,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1374/500000] + train/ActionNoiseL2Loss=0.1971 + throughput/total_tokens=263,808,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1375/500000] + train/ActionNoiseL2Loss=0.1294 + throughput/total_tokens=264,000,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1376/500000] + train/ActionNoiseL2Loss=0.1099 + throughput/total_tokens=264,192,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1377/500000] + train/ActionNoiseL2Loss=0.1111 + throughput/total_tokens=264,384,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1378/500000] + train/ActionNoiseL2Loss=0.1595 + throughput/total_tokens=264,576,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1379/500000] + train/ActionNoiseL2Loss=0.1512 + throughput/total_tokens=264,768,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1380/500000] + optim/total_grad_norm=4.847 + train/ActionNoiseL2Loss=0.1581 + throughput/total_tokens=264,960,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1381/500000] + train/ActionNoiseL2Loss=0.2007 + throughput/total_tokens=265,152,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1382/500000] + train/ActionNoiseL2Loss=0.3333 + throughput/total_tokens=265,344,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1383/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=265,536,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1384/500000] + train/ActionNoiseL2Loss=0.1249 + throughput/total_tokens=265,728,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1385/500000] + train/ActionNoiseL2Loss=0.1824 + throughput/total_tokens=265,920,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1386/500000] + train/ActionNoiseL2Loss=0.1308 + throughput/total_tokens=266,112,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1387/500000] + train/ActionNoiseL2Loss=0.1929 + throughput/total_tokens=266,304,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1388/500000] + train/ActionNoiseL2Loss=0.2525 + throughput/total_tokens=266,496,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1389/500000] + train/ActionNoiseL2Loss=0.2298 + throughput/total_tokens=266,688,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1390/500000] + train/ActionNoiseL2Loss=0.1641 + throughput/total_tokens=266,880,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1391/500000] + train/ActionNoiseL2Loss=0.1495 + throughput/total_tokens=267,072,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1392/500000] + train/ActionNoiseL2Loss=0.1181 + throughput/total_tokens=267,264,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1393/500000] + train/ActionNoiseL2Loss=0.1634 + throughput/total_tokens=267,456,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1394/500000] + train/ActionNoiseL2Loss=0.1587 + throughput/total_tokens=267,648,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1395/500000] + train/ActionNoiseL2Loss=0.1494 + throughput/total_tokens=267,840,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1396/500000] + train/ActionNoiseL2Loss=0.1247 + throughput/total_tokens=268,032,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1397/500000] + train/ActionNoiseL2Loss=0.1156 + throughput/total_tokens=268,224,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1398/500000] + train/ActionNoiseL2Loss=0.1301 + throughput/total_tokens=268,416,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1399/500000] + train/ActionNoiseL2Loss=0.1847 + throughput/total_tokens=268,608,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1400/500000] + optim/total_grad_norm=3.607 + train/ActionNoiseL2Loss=0.1329 + throughput/total_tokens=268,800,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1401/500000] + train/ActionNoiseL2Loss=0.1450 + throughput/total_tokens=268,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1402/500000] + train/ActionNoiseL2Loss=0.1644 + throughput/total_tokens=269,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1403/500000] + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=269,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1404/500000] + train/ActionNoiseL2Loss=0.2054 + throughput/total_tokens=269,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1405/500000] + train/ActionNoiseL2Loss=0.1437 + throughput/total_tokens=269,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1406/500000] + train/ActionNoiseL2Loss=0.1294 + throughput/total_tokens=269,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1407/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=270,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1408/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=270,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1409/500000] + train/ActionNoiseL2Loss=0.1165 + throughput/total_tokens=270,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1410/500000] + train/ActionNoiseL2Loss=0.1976 + throughput/total_tokens=270,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1411/500000] + train/ActionNoiseL2Loss=0.1331 + throughput/total_tokens=270,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1412/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=271,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1413/500000] + train/ActionNoiseL2Loss=0.2260 + throughput/total_tokens=271,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1414/500000] + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=271,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1415/500000] + train/ActionNoiseL2Loss=0.1327 + throughput/total_tokens=271,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1416/500000] + train/ActionNoiseL2Loss=0.1409 + throughput/total_tokens=271,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1417/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=272,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1418/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=272,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1419/500000] + train/ActionNoiseL2Loss=0.2106 + throughput/total_tokens=272,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1420/500000] + optim/total_grad_norm=5.258 + train/ActionNoiseL2Loss=0.1878 + throughput/total_tokens=272,640,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1421/500000] + train/ActionNoiseL2Loss=0.1442 + throughput/total_tokens=272,832,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1422/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=273,024,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1423/500000] + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=273,216,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1424/500000] + train/ActionNoiseL2Loss=0.2667 + throughput/total_tokens=273,408,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1425/500000] + train/ActionNoiseL2Loss=0.1999 + throughput/total_tokens=273,600,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1426/500000] + train/ActionNoiseL2Loss=0.1204 + throughput/total_tokens=273,792,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1427/500000] + train/ActionNoiseL2Loss=0.1243 + throughput/total_tokens=273,984,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1428/500000] + train/ActionNoiseL2Loss=0.1476 + throughput/total_tokens=274,176,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1429/500000] + train/ActionNoiseL2Loss=0.1661 + throughput/total_tokens=274,368,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1430/500000] + train/ActionNoiseL2Loss=0.1434 + throughput/total_tokens=274,560,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1431/500000] + train/ActionNoiseL2Loss=0.1558 + throughput/total_tokens=274,752,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1432/500000] + train/ActionNoiseL2Loss=0.1761 + throughput/total_tokens=274,944,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1433/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=275,136,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1434/500000] + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=275,328,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1435/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=275,520,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1436/500000] + train/ActionNoiseL2Loss=0.1342 + throughput/total_tokens=275,712,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1437/500000] + train/ActionNoiseL2Loss=0.1642 + throughput/total_tokens=275,904,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1438/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=276,096,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1439/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=276,288,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1440/500000] + optim/total_grad_norm=4.365 + train/ActionNoiseL2Loss=0.1242 + throughput/total_tokens=276,480,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1441/500000] + train/ActionNoiseL2Loss=0.1133 + throughput/total_tokens=276,672,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1442/500000] + train/ActionNoiseL2Loss=0.1424 + throughput/total_tokens=276,864,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1443/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=277,056,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1444/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=277,248,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1445/500000] + train/ActionNoiseL2Loss=0.1227 + throughput/total_tokens=277,440,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1446/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=277,632,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1447/500000] + train/ActionNoiseL2Loss=0.1943 + throughput/total_tokens=277,824,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1448/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=278,016,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1449/500000] + train/ActionNoiseL2Loss=0.1265 + throughput/total_tokens=278,208,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1450/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=278,400,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1451/500000] + train/ActionNoiseL2Loss=0.2100 + throughput/total_tokens=278,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1452/500000] + train/ActionNoiseL2Loss=0.1214 + throughput/total_tokens=278,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1453/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=278,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1454/500000] + train/ActionNoiseL2Loss=0.2375 + throughput/total_tokens=279,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1455/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=279,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1456/500000] + train/ActionNoiseL2Loss=0.1700 + throughput/total_tokens=279,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1457/500000] + train/ActionNoiseL2Loss=0.1349 + throughput/total_tokens=279,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1458/500000] + train/ActionNoiseL2Loss=0.1364 + throughput/total_tokens=279,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1459/500000] + train/ActionNoiseL2Loss=0.1591 + throughput/total_tokens=280,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1460/500000] + optim/total_grad_norm=5.263 + train/ActionNoiseL2Loss=0.2284 + throughput/total_tokens=280,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1461/500000] + train/ActionNoiseL2Loss=0.2685 + throughput/total_tokens=280,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1462/500000] + train/ActionNoiseL2Loss=0.1311 + throughput/total_tokens=280,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1463/500000] + train/ActionNoiseL2Loss=0.1525 + throughput/total_tokens=280,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1464/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=281,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1465/500000] + train/ActionNoiseL2Loss=0.1422 + throughput/total_tokens=281,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1466/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=281,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1467/500000] + train/ActionNoiseL2Loss=0.1212 + throughput/total_tokens=281,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1468/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=281,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1469/500000] + train/ActionNoiseL2Loss=0.1713 + throughput/total_tokens=282,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1470/500000] + train/ActionNoiseL2Loss=0.1558 + throughput/total_tokens=282,240,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1471/500000] + train/ActionNoiseL2Loss=0.1142 + throughput/total_tokens=282,432,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1472/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=282,624,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1473/500000] + train/ActionNoiseL2Loss=0.2211 + throughput/total_tokens=282,816,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1474/500000] + train/ActionNoiseL2Loss=0.1768 + throughput/total_tokens=283,008,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1475/500000] + train/ActionNoiseL2Loss=0.1084 + throughput/total_tokens=283,200,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1476/500000] + train/ActionNoiseL2Loss=0.1581 + throughput/total_tokens=283,392,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1477/500000] + train/ActionNoiseL2Loss=0.1886 + throughput/total_tokens=283,584,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1478/500000] + train/ActionNoiseL2Loss=0.1128 + throughput/total_tokens=283,776,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1479/500000] + train/ActionNoiseL2Loss=0.1112 + throughput/total_tokens=283,968,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1480/500000] + optim/total_grad_norm=3.512 + train/ActionNoiseL2Loss=0.1335 + throughput/total_tokens=284,160,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1481/500000] + train/ActionNoiseL2Loss=0.1895 + throughput/total_tokens=284,352,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1482/500000] + train/ActionNoiseL2Loss=0.1483 + throughput/total_tokens=284,544,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1483/500000] + train/ActionNoiseL2Loss=0.2039 + throughput/total_tokens=284,736,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1484/500000] + train/ActionNoiseL2Loss=0.1133 + throughput/total_tokens=284,928,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1485/500000] + train/ActionNoiseL2Loss=0.1564 + throughput/total_tokens=285,120,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1486/500000] + train/ActionNoiseL2Loss=0.1664 + throughput/total_tokens=285,312,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1487/500000] + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=285,504,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1488/500000] + train/ActionNoiseL2Loss=0.1280 + throughput/total_tokens=285,696,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1489/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=285,888,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1490/500000] + train/ActionNoiseL2Loss=0.1532 + throughput/total_tokens=286,080,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1491/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=286,272,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1492/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=286,464,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1493/500000] + train/ActionNoiseL2Loss=0.1569 + throughput/total_tokens=286,656,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1494/500000] + train/ActionNoiseL2Loss=0.1261 + throughput/total_tokens=286,848,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1495/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=287,040,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1496/500000] + train/ActionNoiseL2Loss=0.1465 + throughput/total_tokens=287,232,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1497/500000] + train/ActionNoiseL2Loss=0.1799 + throughput/total_tokens=287,424,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1498/500000] + train/ActionNoiseL2Loss=0.2420 + throughput/total_tokens=287,616,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1499/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=287,808,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1500/500000] + optim/total_grad_norm=3.570 + train/ActionNoiseL2Loss=0.1432 + throughput/total_tokens=288,000,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +10/06 [01:32:38] INFO | >> Saving config... checkpoint.py:608 +10/06 [01:33:25] INFO | >> Saving model state... checkpoint.py:796 +10/06 [01:34:36] INFO | >> Saving optim state... checkpoint.py:811 +10/06 [01:36:08] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=1501/500000] + train/ActionNoiseL2Loss=0.1448 + throughput/total_tokens=288,192,000 + throughput/device/tokens_per_second=1,197 + throughput/device/batches_per_second=0.0499 +[step=1502/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=288,384,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=1503/500000] + train/ActionNoiseL2Loss=0.2216 + throughput/total_tokens=288,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=1504/500000] + train/ActionNoiseL2Loss=0.2147 + throughput/total_tokens=288,768,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1505/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=288,960,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1506/500000] + train/ActionNoiseL2Loss=0.2187 + throughput/total_tokens=289,152,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1507/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=289,344,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1508/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=289,536,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1509/500000] + train/ActionNoiseL2Loss=0.1428 + throughput/total_tokens=289,728,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1510/500000] + train/ActionNoiseL2Loss=0.2130 + throughput/total_tokens=289,920,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1511/500000] + train/ActionNoiseL2Loss=0.1264 + throughput/total_tokens=290,112,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1512/500000] + train/ActionNoiseL2Loss=0.1321 + throughput/total_tokens=290,304,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1513/500000] + train/ActionNoiseL2Loss=0.1059 + throughput/total_tokens=290,496,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1514/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=290,688,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1515/500000] + train/ActionNoiseL2Loss=0.1974 + throughput/total_tokens=290,880,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1516/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=291,072,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1517/500000] + train/ActionNoiseL2Loss=0.1256 + throughput/total_tokens=291,264,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1518/500000] + train/ActionNoiseL2Loss=0.1185 + throughput/total_tokens=291,456,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1519/500000] + train/ActionNoiseL2Loss=0.1745 + throughput/total_tokens=291,648,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1520/500000] + optim/total_grad_norm=4.309 + train/ActionNoiseL2Loss=0.1226 + throughput/total_tokens=291,840,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1521/500000] + train/ActionNoiseL2Loss=0.1687 + throughput/total_tokens=292,032,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1522/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=292,224,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1523/500000] + train/ActionNoiseL2Loss=0.1373 + throughput/total_tokens=292,416,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1524/500000] + train/ActionNoiseL2Loss=0.1548 + throughput/total_tokens=292,608,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1525/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=292,800,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1526/500000] + train/ActionNoiseL2Loss=0.1856 + throughput/total_tokens=292,992,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1527/500000] + train/ActionNoiseL2Loss=0.1417 + throughput/total_tokens=293,184,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1528/500000] + train/ActionNoiseL2Loss=0.1158 + throughput/total_tokens=293,376,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1529/500000] + train/ActionNoiseL2Loss=0.1142 + throughput/total_tokens=293,568,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1530/500000] + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=293,760,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1531/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=293,952,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1532/500000] + train/ActionNoiseL2Loss=0.2396 + throughput/total_tokens=294,144,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1533/500000] + train/ActionNoiseL2Loss=0.2129 + throughput/total_tokens=294,336,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1534/500000] + train/ActionNoiseL2Loss=0.1661 + throughput/total_tokens=294,528,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1535/500000] + train/ActionNoiseL2Loss=0.1330 + throughput/total_tokens=294,720,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1536/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=294,912,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1537/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=295,104,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1538/500000] + train/ActionNoiseL2Loss=0.2049 + throughput/total_tokens=295,296,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1539/500000] + train/ActionNoiseL2Loss=0.1465 + throughput/total_tokens=295,488,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1540/500000] + optim/total_grad_norm=2.970 + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=295,680,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1541/500000] + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=295,872,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1542/500000] + train/ActionNoiseL2Loss=0.1711 + throughput/total_tokens=296,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1543/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=296,256,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1544/500000] + train/ActionNoiseL2Loss=0.1687 + throughput/total_tokens=296,448,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1545/500000] + train/ActionNoiseL2Loss=0.1821 + throughput/total_tokens=296,640,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1546/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=296,832,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1547/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=297,024,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1548/500000] + train/ActionNoiseL2Loss=0.1689 + throughput/total_tokens=297,216,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1549/500000] + train/ActionNoiseL2Loss=0.1574 + throughput/total_tokens=297,408,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1550/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=297,600,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1551/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=297,792,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1552/500000] + train/ActionNoiseL2Loss=0.1665 + throughput/total_tokens=297,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1553/500000] + train/ActionNoiseL2Loss=0.1265 + throughput/total_tokens=298,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1554/500000] + train/ActionNoiseL2Loss=0.2397 + throughput/total_tokens=298,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1555/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=298,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1556/500000] + train/ActionNoiseL2Loss=0.1181 + throughput/total_tokens=298,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1557/500000] + train/ActionNoiseL2Loss=0.1331 + throughput/total_tokens=298,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1558/500000] + train/ActionNoiseL2Loss=0.1204 + throughput/total_tokens=299,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1559/500000] + train/ActionNoiseL2Loss=0.1276 + throughput/total_tokens=299,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1560/500000] + optim/total_grad_norm=2.798 + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=299,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1561/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=299,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1562/500000] + train/ActionNoiseL2Loss=0.1121 + throughput/total_tokens=299,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1563/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=300,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1564/500000] + train/ActionNoiseL2Loss=0.1572 + throughput/total_tokens=300,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1565/500000] + train/ActionNoiseL2Loss=0.1417 + throughput/total_tokens=300,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1566/500000] + train/ActionNoiseL2Loss=0.1755 + throughput/total_tokens=300,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1567/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=300,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1568/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=301,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1569/500000] + train/ActionNoiseL2Loss=0.1954 + throughput/total_tokens=301,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1570/500000] + train/ActionNoiseL2Loss=0.2008 + throughput/total_tokens=301,440,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1571/500000] + train/ActionNoiseL2Loss=0.1441 + throughput/total_tokens=301,632,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1572/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=301,824,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1573/500000] + train/ActionNoiseL2Loss=0.1257 + throughput/total_tokens=302,016,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1574/500000] + train/ActionNoiseL2Loss=0.1053 + throughput/total_tokens=302,208,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1575/500000] + train/ActionNoiseL2Loss=0.1258 + throughput/total_tokens=302,400,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1576/500000] + train/ActionNoiseL2Loss=0.1700 + throughput/total_tokens=302,592,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1577/500000] + train/ActionNoiseL2Loss=0.1714 + throughput/total_tokens=302,784,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1578/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=302,976,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1579/500000] + train/ActionNoiseL2Loss=0.1895 + throughput/total_tokens=303,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1580/500000] + optim/total_grad_norm=3.429 + train/ActionNoiseL2Loss=0.1264 + throughput/total_tokens=303,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1581/500000] + train/ActionNoiseL2Loss=0.1357 + throughput/total_tokens=303,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1582/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=303,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1583/500000] + train/ActionNoiseL2Loss=0.1222 + throughput/total_tokens=303,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1584/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=304,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1585/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=304,320,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1586/500000] + train/ActionNoiseL2Loss=0.1896 + throughput/total_tokens=304,512,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1587/500000] + train/ActionNoiseL2Loss=0.1131 + throughput/total_tokens=304,704,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1588/500000] + train/ActionNoiseL2Loss=0.1469 + throughput/total_tokens=304,896,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1589/500000] + train/ActionNoiseL2Loss=0.1761 + throughput/total_tokens=305,088,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1590/500000] + train/ActionNoiseL2Loss=0.1803 + throughput/total_tokens=305,280,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1591/500000] + train/ActionNoiseL2Loss=0.1193 + throughput/total_tokens=305,472,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1592/500000] + train/ActionNoiseL2Loss=0.1462 + throughput/total_tokens=305,664,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1593/500000] + train/ActionNoiseL2Loss=0.1205 + throughput/total_tokens=305,856,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1594/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=306,048,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1595/500000] + train/ActionNoiseL2Loss=0.1540 + throughput/total_tokens=306,240,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1596/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=306,432,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1597/500000] + train/ActionNoiseL2Loss=0.1799 + throughput/total_tokens=306,624,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1598/500000] + train/ActionNoiseL2Loss=0.1106 + throughput/total_tokens=306,816,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1599/500000] + train/ActionNoiseL2Loss=0.2148 + throughput/total_tokens=307,008,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1600/500000] + optim/total_grad_norm=4.506 + train/ActionNoiseL2Loss=0.1511 + throughput/total_tokens=307,200,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1601/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=307,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1602/500000] + train/ActionNoiseL2Loss=0.1395 + throughput/total_tokens=307,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1603/500000] + train/ActionNoiseL2Loss=0.1355 + throughput/total_tokens=307,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1604/500000] + train/ActionNoiseL2Loss=0.1248 + throughput/total_tokens=307,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1605/500000] + train/ActionNoiseL2Loss=0.1315 + throughput/total_tokens=308,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1606/500000] + train/ActionNoiseL2Loss=0.1403 + throughput/total_tokens=308,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1607/500000] + train/ActionNoiseL2Loss=0.1184 + throughput/total_tokens=308,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1608/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=308,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1609/500000] + train/ActionNoiseL2Loss=0.1526 + throughput/total_tokens=308,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1610/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=309,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1611/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=309,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1612/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=309,504,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1613/500000] + train/ActionNoiseL2Loss=0.1246 + throughput/total_tokens=309,696,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1614/500000] + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=309,888,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1615/500000] + train/ActionNoiseL2Loss=0.1497 + throughput/total_tokens=310,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1616/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=310,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1617/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=310,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1618/500000] + train/ActionNoiseL2Loss=0.1347 + throughput/total_tokens=310,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1619/500000] + train/ActionNoiseL2Loss=0.1596 + throughput/total_tokens=310,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1620/500000] + optim/total_grad_norm=2.786 + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=311,040,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1621/500000] + train/ActionNoiseL2Loss=0.1989 + throughput/total_tokens=311,232,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1622/500000] + train/ActionNoiseL2Loss=0.1407 + throughput/total_tokens=311,424,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1623/500000] + train/ActionNoiseL2Loss=0.1124 + throughput/total_tokens=311,616,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1624/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=311,808,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1625/500000] + train/ActionNoiseL2Loss=0.1425 + throughput/total_tokens=312,000,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1626/500000] + train/ActionNoiseL2Loss=0.1095 + throughput/total_tokens=312,192,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1627/500000] + train/ActionNoiseL2Loss=0.1302 + throughput/total_tokens=312,384,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1628/500000] + train/ActionNoiseL2Loss=0.1940 + throughput/total_tokens=312,576,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1629/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=312,768,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1630/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=312,960,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1631/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=313,152,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1632/500000] + train/ActionNoiseL2Loss=0.1158 + throughput/total_tokens=313,344,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1633/500000] + train/ActionNoiseL2Loss=0.1220 + throughput/total_tokens=313,536,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1634/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=313,728,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1635/500000] + train/ActionNoiseL2Loss=0.1906 + throughput/total_tokens=313,920,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1636/500000] + train/ActionNoiseL2Loss=0.1843 + throughput/total_tokens=314,112,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1637/500000] + train/ActionNoiseL2Loss=0.1112 + throughput/total_tokens=314,304,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1638/500000] + train/ActionNoiseL2Loss=0.2564 + throughput/total_tokens=314,496,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1639/500000] + train/ActionNoiseL2Loss=0.1226 + throughput/total_tokens=314,688,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1640/500000] + optim/total_grad_norm=5.411 + train/ActionNoiseL2Loss=0.1797 + throughput/total_tokens=314,880,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1641/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=315,072,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1642/500000] + train/ActionNoiseL2Loss=0.1927 + throughput/total_tokens=315,264,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1643/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=315,456,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1644/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=315,648,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1645/500000] + train/ActionNoiseL2Loss=0.1118 + throughput/total_tokens=315,840,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1646/500000] + train/ActionNoiseL2Loss=0.1259 + throughput/total_tokens=316,032,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1647/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=316,224,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1648/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=316,416,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1649/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=316,608,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1650/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=316,800,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1651/500000] + train/ActionNoiseL2Loss=0.1462 + throughput/total_tokens=316,992,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1652/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=317,184,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1653/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=317,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1654/500000] + train/ActionNoiseL2Loss=0.1371 + throughput/total_tokens=317,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1655/500000] + train/ActionNoiseL2Loss=0.1469 + throughput/total_tokens=317,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1656/500000] + train/ActionNoiseL2Loss=0.1640 + throughput/total_tokens=317,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1657/500000] + train/ActionNoiseL2Loss=0.1721 + throughput/total_tokens=318,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1658/500000] + train/ActionNoiseL2Loss=0.1642 + throughput/total_tokens=318,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1659/500000] + train/ActionNoiseL2Loss=0.1630 + throughput/total_tokens=318,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1660/500000] + optim/total_grad_norm=2.560 + train/ActionNoiseL2Loss=0.1319 + throughput/total_tokens=318,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1661/500000] + train/ActionNoiseL2Loss=0.2503 + throughput/total_tokens=318,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1662/500000] + train/ActionNoiseL2Loss=0.2029 + throughput/total_tokens=319,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1663/500000] + train/ActionNoiseL2Loss=0.2504 + throughput/total_tokens=319,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1664/500000] + train/ActionNoiseL2Loss=0.2322 + throughput/total_tokens=319,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1665/500000] + train/ActionNoiseL2Loss=0.1321 + throughput/total_tokens=319,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1666/500000] + train/ActionNoiseL2Loss=0.1421 + throughput/total_tokens=319,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1667/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=320,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1668/500000] + train/ActionNoiseL2Loss=0.2014 + throughput/total_tokens=320,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1669/500000] + train/ActionNoiseL2Loss=0.1536 + throughput/total_tokens=320,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1670/500000] + train/ActionNoiseL2Loss=0.1146 + throughput/total_tokens=320,640,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1671/500000] + train/ActionNoiseL2Loss=0.1334 + throughput/total_tokens=320,832,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1672/500000] + train/ActionNoiseL2Loss=0.1116 + throughput/total_tokens=321,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1673/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=321,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1674/500000] + train/ActionNoiseL2Loss=0.1503 + throughput/total_tokens=321,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1675/500000] + train/ActionNoiseL2Loss=0.1524 + throughput/total_tokens=321,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1676/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=321,792,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1677/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=321,984,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1678/500000] + train/ActionNoiseL2Loss=0.1340 + throughput/total_tokens=322,176,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1679/500000] + train/ActionNoiseL2Loss=0.1691 + throughput/total_tokens=322,368,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1680/500000] + optim/total_grad_norm=3.090 + train/ActionNoiseL2Loss=0.1154 + throughput/total_tokens=322,560,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1681/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=322,752,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1682/500000] + train/ActionNoiseL2Loss=0.1102 + throughput/total_tokens=322,944,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1683/500000] + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=323,136,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1684/500000] + train/ActionNoiseL2Loss=0.1394 + throughput/total_tokens=323,328,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1685/500000] + train/ActionNoiseL2Loss=0.1739 + throughput/total_tokens=323,520,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1686/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=323,712,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1687/500000] + train/ActionNoiseL2Loss=0.1590 + throughput/total_tokens=323,904,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1688/500000] + train/ActionNoiseL2Loss=0.1749 + throughput/total_tokens=324,096,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1689/500000] + train/ActionNoiseL2Loss=0.1058 + throughput/total_tokens=324,288,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1690/500000] + train/ActionNoiseL2Loss=0.1184 + throughput/total_tokens=324,480,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1691/500000] + train/ActionNoiseL2Loss=0.1636 + throughput/total_tokens=324,672,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1692/500000] + train/ActionNoiseL2Loss=0.1817 + throughput/total_tokens=324,864,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1693/500000] + train/ActionNoiseL2Loss=0.2001 + throughput/total_tokens=325,056,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1694/500000] + train/ActionNoiseL2Loss=0.1285 + throughput/total_tokens=325,248,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1695/500000] + train/ActionNoiseL2Loss=0.1204 + throughput/total_tokens=325,440,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1696/500000] + train/ActionNoiseL2Loss=0.2253 + throughput/total_tokens=325,632,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1697/500000] + train/ActionNoiseL2Loss=0.1715 + throughput/total_tokens=325,824,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1698/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=326,016,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1699/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=326,208,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1700/500000] + optim/total_grad_norm=2.885 + train/ActionNoiseL2Loss=0.1458 + throughput/total_tokens=326,400,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1701/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=326,592,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1702/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=326,784,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1703/500000] + train/ActionNoiseL2Loss=0.1399 + throughput/total_tokens=326,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1704/500000] + train/ActionNoiseL2Loss=0.1461 + throughput/total_tokens=327,168,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1705/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=327,360,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1706/500000] + train/ActionNoiseL2Loss=0.1346 + throughput/total_tokens=327,552,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1707/500000] + train/ActionNoiseL2Loss=0.1635 + throughput/total_tokens=327,744,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1708/500000] + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=327,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1709/500000] + train/ActionNoiseL2Loss=0.1072 + throughput/total_tokens=328,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1710/500000] + train/ActionNoiseL2Loss=0.1301 + throughput/total_tokens=328,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1711/500000] + train/ActionNoiseL2Loss=0.1343 + throughput/total_tokens=328,512,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1712/500000] + train/ActionNoiseL2Loss=0.1458 + throughput/total_tokens=328,704,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1713/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=328,896,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1714/500000] + train/ActionNoiseL2Loss=0.2677 + throughput/total_tokens=329,088,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1715/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=329,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1716/500000] + train/ActionNoiseL2Loss=0.2067 + throughput/total_tokens=329,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1717/500000] + train/ActionNoiseL2Loss=0.2149 + throughput/total_tokens=329,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1718/500000] + train/ActionNoiseL2Loss=0.1603 + throughput/total_tokens=329,856,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1719/500000] + train/ActionNoiseL2Loss=0.1299 + throughput/total_tokens=330,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1720/500000] + optim/total_grad_norm=3.695 + train/ActionNoiseL2Loss=0.1661 + throughput/total_tokens=330,240,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1721/500000] + train/ActionNoiseL2Loss=0.2099 + throughput/total_tokens=330,432,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1722/500000] + train/ActionNoiseL2Loss=0.1639 + throughput/total_tokens=330,624,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1723/500000] + train/ActionNoiseL2Loss=0.1638 + throughput/total_tokens=330,816,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1724/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=331,008,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1725/500000] + train/ActionNoiseL2Loss=0.1460 + throughput/total_tokens=331,200,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1726/500000] + train/ActionNoiseL2Loss=0.1392 + throughput/total_tokens=331,392,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1727/500000] + train/ActionNoiseL2Loss=0.1502 + throughput/total_tokens=331,584,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1728/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=331,776,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1729/500000] + train/ActionNoiseL2Loss=0.1587 + throughput/total_tokens=331,968,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1730/500000] + train/ActionNoiseL2Loss=0.1476 + throughput/total_tokens=332,160,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1731/500000] + train/ActionNoiseL2Loss=0.1181 + throughput/total_tokens=332,352,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1732/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=332,544,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1733/500000] + train/ActionNoiseL2Loss=0.1203 + throughput/total_tokens=332,736,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1734/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=332,928,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1735/500000] + train/ActionNoiseL2Loss=0.1962 + throughput/total_tokens=333,120,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1736/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=333,312,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1737/500000] + train/ActionNoiseL2Loss=0.1138 + throughput/total_tokens=333,504,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1738/500000] + train/ActionNoiseL2Loss=0.1568 + throughput/total_tokens=333,696,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1739/500000] + train/ActionNoiseL2Loss=0.2321 + throughput/total_tokens=333,888,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1740/500000] + optim/total_grad_norm=2.737 + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=334,080,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1741/500000] + train/ActionNoiseL2Loss=0.1565 + throughput/total_tokens=334,272,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1742/500000] + train/ActionNoiseL2Loss=0.1445 + throughput/total_tokens=334,464,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1743/500000] + train/ActionNoiseL2Loss=0.1504 + throughput/total_tokens=334,656,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1744/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=334,848,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1745/500000] + train/ActionNoiseL2Loss=0.1396 + throughput/total_tokens=335,040,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1746/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=335,232,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1747/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=335,424,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1748/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=335,616,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1749/500000] + train/ActionNoiseL2Loss=0.1057 + throughput/total_tokens=335,808,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1750/500000] + train/ActionNoiseL2Loss=0.2318 + throughput/total_tokens=336,000,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1751/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=336,192,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1752/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=336,384,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1753/500000] + train/ActionNoiseL2Loss=0.1193 + throughput/total_tokens=336,576,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1754/500000] + train/ActionNoiseL2Loss=0.1922 + throughput/total_tokens=336,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1755/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=336,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1756/500000] + train/ActionNoiseL2Loss=0.1729 + throughput/total_tokens=337,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1757/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=337,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1758/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=337,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1759/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=337,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1760/500000] + optim/total_grad_norm=2.172 + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=337,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1761/500000] + train/ActionNoiseL2Loss=0.1302 + throughput/total_tokens=338,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1762/500000] + train/ActionNoiseL2Loss=0.1341 + throughput/total_tokens=338,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1763/500000] + train/ActionNoiseL2Loss=0.1635 + throughput/total_tokens=338,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1764/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=338,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1765/500000] + train/ActionNoiseL2Loss=0.1318 + throughput/total_tokens=338,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1766/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=339,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1767/500000] + train/ActionNoiseL2Loss=0.1484 + throughput/total_tokens=339,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1768/500000] + train/ActionNoiseL2Loss=0.1736 + throughput/total_tokens=339,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1769/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=339,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1770/500000] + train/ActionNoiseL2Loss=0.1417 + throughput/total_tokens=339,840,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1771/500000] + train/ActionNoiseL2Loss=0.1378 + throughput/total_tokens=340,032,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1772/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=340,224,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1773/500000] + train/ActionNoiseL2Loss=0.2256 + throughput/total_tokens=340,416,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1774/500000] + train/ActionNoiseL2Loss=0.1851 + throughput/total_tokens=340,608,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1775/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=340,800,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1776/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=340,992,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1777/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=341,184,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1778/500000] + train/ActionNoiseL2Loss=0.1577 + throughput/total_tokens=341,376,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1779/500000] + train/ActionNoiseL2Loss=0.1890 + throughput/total_tokens=341,568,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1780/500000] + optim/total_grad_norm=3.931 + train/ActionNoiseL2Loss=0.1554 + throughput/total_tokens=341,760,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1781/500000] + train/ActionNoiseL2Loss=0.1439 + throughput/total_tokens=341,952,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1782/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=342,144,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1783/500000] + train/ActionNoiseL2Loss=0.1501 + throughput/total_tokens=342,336,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1784/500000] + train/ActionNoiseL2Loss=0.1652 + throughput/total_tokens=342,528,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1785/500000] + train/ActionNoiseL2Loss=0.1988 + throughput/total_tokens=342,720,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1786/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=342,912,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1787/500000] + train/ActionNoiseL2Loss=0.1192 + throughput/total_tokens=343,104,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1788/500000] + train/ActionNoiseL2Loss=0.1111 + throughput/total_tokens=343,296,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1789/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=343,488,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1790/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=343,680,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1791/500000] + train/ActionNoiseL2Loss=0.1597 + throughput/total_tokens=343,872,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1792/500000] + train/ActionNoiseL2Loss=0.1123 + throughput/total_tokens=344,064,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1793/500000] + train/ActionNoiseL2Loss=0.1090 + throughput/total_tokens=344,256,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1794/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=344,448,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1795/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=344,640,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1796/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=344,832,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1797/500000] + train/ActionNoiseL2Loss=0.1013 + throughput/total_tokens=345,024,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1798/500000] + train/ActionNoiseL2Loss=0.1313 + throughput/total_tokens=345,216,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1799/500000] + train/ActionNoiseL2Loss=0.1653 + throughput/total_tokens=345,408,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1800/500000] + optim/total_grad_norm=2.536 + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=345,600,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1801/500000] + train/ActionNoiseL2Loss=0.1295 + throughput/total_tokens=345,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1802/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=345,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1803/500000] + train/ActionNoiseL2Loss=0.1741 + throughput/total_tokens=346,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1804/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=346,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1805/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=346,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1806/500000] + train/ActionNoiseL2Loss=0.1565 + throughput/total_tokens=346,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1807/500000] + train/ActionNoiseL2Loss=0.1182 + throughput/total_tokens=346,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1808/500000] + train/ActionNoiseL2Loss=0.1437 + throughput/total_tokens=347,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1809/500000] + train/ActionNoiseL2Loss=0.0968 + throughput/total_tokens=347,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1810/500000] + train/ActionNoiseL2Loss=0.1632 + throughput/total_tokens=347,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1811/500000] + train/ActionNoiseL2Loss=0.1165 + throughput/total_tokens=347,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1812/500000] + train/ActionNoiseL2Loss=0.1053 + throughput/total_tokens=347,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1813/500000] + train/ActionNoiseL2Loss=0.1141 + throughput/total_tokens=348,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1814/500000] + train/ActionNoiseL2Loss=0.2125 + throughput/total_tokens=348,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1815/500000] + train/ActionNoiseL2Loss=0.1175 + throughput/total_tokens=348,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1816/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=348,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1817/500000] + train/ActionNoiseL2Loss=0.0971 + throughput/total_tokens=348,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1818/500000] + train/ActionNoiseL2Loss=0.1440 + throughput/total_tokens=349,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1819/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=349,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1820/500000] + optim/total_grad_norm=3.651 + train/ActionNoiseL2Loss=0.1508 + throughput/total_tokens=349,440,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1821/500000] + train/ActionNoiseL2Loss=0.1815 + throughput/total_tokens=349,632,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1822/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=349,824,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1823/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=350,016,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1824/500000] + train/ActionNoiseL2Loss=0.1198 + throughput/total_tokens=350,208,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1825/500000] + train/ActionNoiseL2Loss=0.1326 + throughput/total_tokens=350,400,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1826/500000] + train/ActionNoiseL2Loss=0.2041 + throughput/total_tokens=350,592,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1827/500000] + train/ActionNoiseL2Loss=0.1293 + throughput/total_tokens=350,784,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1828/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=350,976,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1829/500000] + train/ActionNoiseL2Loss=0.1401 + throughput/total_tokens=351,168,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1830/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=351,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1831/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=351,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1832/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=351,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1833/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=351,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1834/500000] + train/ActionNoiseL2Loss=0.1420 + throughput/total_tokens=352,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1835/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=352,320,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1836/500000] + train/ActionNoiseL2Loss=0.2113 + throughput/total_tokens=352,512,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1837/500000] + train/ActionNoiseL2Loss=0.1243 + throughput/total_tokens=352,704,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1838/500000] + train/ActionNoiseL2Loss=0.1436 + throughput/total_tokens=352,896,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1839/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=353,088,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1840/500000] + optim/total_grad_norm=3.713 + train/ActionNoiseL2Loss=0.1206 + throughput/total_tokens=353,280,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1841/500000] + train/ActionNoiseL2Loss=0.1402 + throughput/total_tokens=353,472,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1842/500000] + train/ActionNoiseL2Loss=0.1261 + throughput/total_tokens=353,664,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1843/500000] + train/ActionNoiseL2Loss=0.1568 + throughput/total_tokens=353,856,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1844/500000] + train/ActionNoiseL2Loss=0.2829 + throughput/total_tokens=354,048,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1845/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=354,240,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1846/500000] + train/ActionNoiseL2Loss=0.1366 + throughput/total_tokens=354,432,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1847/500000] + train/ActionNoiseL2Loss=0.1358 + throughput/total_tokens=354,624,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1848/500000] + train/ActionNoiseL2Loss=0.1399 + throughput/total_tokens=354,816,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1849/500000] + train/ActionNoiseL2Loss=0.1125 + throughput/total_tokens=355,008,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1850/500000] + train/ActionNoiseL2Loss=0.1951 + throughput/total_tokens=355,200,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1851/500000] + train/ActionNoiseL2Loss=0.1222 + throughput/total_tokens=355,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1852/500000] + train/ActionNoiseL2Loss=0.1231 + throughput/total_tokens=355,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1853/500000] + train/ActionNoiseL2Loss=0.1905 + throughput/total_tokens=355,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1854/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=355,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1855/500000] + train/ActionNoiseL2Loss=0.1543 + throughput/total_tokens=356,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1856/500000] + train/ActionNoiseL2Loss=0.1692 + throughput/total_tokens=356,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1857/500000] + train/ActionNoiseL2Loss=0.2076 + throughput/total_tokens=356,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1858/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=356,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1859/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=356,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1860/500000] + optim/total_grad_norm=3.608 + train/ActionNoiseL2Loss=0.1795 + throughput/total_tokens=357,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=1861/500000] + train/ActionNoiseL2Loss=0.1321 + throughput/total_tokens=357,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1862/500000] + train/ActionNoiseL2Loss=0.1945 + throughput/total_tokens=357,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1863/500000] + train/ActionNoiseL2Loss=0.0979 + throughput/total_tokens=357,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1864/500000] + train/ActionNoiseL2Loss=0.0996 + throughput/total_tokens=357,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1865/500000] + train/ActionNoiseL2Loss=0.1623 + throughput/total_tokens=358,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1866/500000] + train/ActionNoiseL2Loss=0.1499 + throughput/total_tokens=358,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1867/500000] + train/ActionNoiseL2Loss=0.1300 + throughput/total_tokens=358,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1868/500000] + train/ActionNoiseL2Loss=0.1119 + throughput/total_tokens=358,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1869/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=358,848,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1870/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=359,040,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1871/500000] + train/ActionNoiseL2Loss=0.1708 + throughput/total_tokens=359,232,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1872/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=359,424,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1873/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=359,616,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1874/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=359,808,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1875/500000] + train/ActionNoiseL2Loss=0.1154 + throughput/total_tokens=360,000,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1876/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=360,192,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1877/500000] + train/ActionNoiseL2Loss=0.1579 + throughput/total_tokens=360,384,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1878/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=360,576,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1879/500000] + train/ActionNoiseL2Loss=0.1261 + throughput/total_tokens=360,768,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1880/500000] + optim/total_grad_norm=2.563 + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=360,960,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1881/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=361,152,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1882/500000] + train/ActionNoiseL2Loss=0.1960 + throughput/total_tokens=361,344,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1883/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=361,536,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1884/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=361,728,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1885/500000] + train/ActionNoiseL2Loss=0.1482 + throughput/total_tokens=361,920,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1886/500000] + train/ActionNoiseL2Loss=0.1608 + throughput/total_tokens=362,112,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1887/500000] + train/ActionNoiseL2Loss=0.1150 + throughput/total_tokens=362,304,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1888/500000] + train/ActionNoiseL2Loss=0.1391 + throughput/total_tokens=362,496,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1889/500000] + train/ActionNoiseL2Loss=0.1277 + throughput/total_tokens=362,688,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1890/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=362,880,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1891/500000] + train/ActionNoiseL2Loss=0.1806 + throughput/total_tokens=363,072,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1892/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=363,264,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1893/500000] + train/ActionNoiseL2Loss=0.1013 + throughput/total_tokens=363,456,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1894/500000] + train/ActionNoiseL2Loss=0.0982 + throughput/total_tokens=363,648,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1895/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=363,840,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1896/500000] + train/ActionNoiseL2Loss=0.1626 + throughput/total_tokens=364,032,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1897/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=364,224,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1898/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=364,416,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1899/500000] + train/ActionNoiseL2Loss=0.1791 + throughput/total_tokens=364,608,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1900/500000] + optim/total_grad_norm=2.895 + train/ActionNoiseL2Loss=0.1012 + throughput/total_tokens=364,800,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1901/500000] + train/ActionNoiseL2Loss=0.2735 + throughput/total_tokens=364,992,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1902/500000] + train/ActionNoiseL2Loss=0.1300 + throughput/total_tokens=365,184,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1903/500000] + train/ActionNoiseL2Loss=0.1177 + throughput/total_tokens=365,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1904/500000] + train/ActionNoiseL2Loss=0.1314 + throughput/total_tokens=365,568,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1905/500000] + train/ActionNoiseL2Loss=0.1926 + throughput/total_tokens=365,760,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1906/500000] + train/ActionNoiseL2Loss=0.1772 + throughput/total_tokens=365,952,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1907/500000] + train/ActionNoiseL2Loss=0.1329 + throughput/total_tokens=366,144,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1908/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=366,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1909/500000] + train/ActionNoiseL2Loss=0.1433 + throughput/total_tokens=366,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1910/500000] + train/ActionNoiseL2Loss=0.1115 + throughput/total_tokens=366,720,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1911/500000] + train/ActionNoiseL2Loss=0.1214 + throughput/total_tokens=366,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1912/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=367,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1913/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=367,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1914/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=367,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1915/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=367,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1916/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=367,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1917/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=368,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1918/500000] + train/ActionNoiseL2Loss=0.1718 + throughput/total_tokens=368,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1919/500000] + train/ActionNoiseL2Loss=0.1100 + throughput/total_tokens=368,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1920/500000] + optim/total_grad_norm=3.172 + train/ActionNoiseL2Loss=0.1967 + throughput/total_tokens=368,640,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1921/500000] + train/ActionNoiseL2Loss=0.1958 + throughput/total_tokens=368,832,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1922/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=369,024,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1923/500000] + train/ActionNoiseL2Loss=0.1350 + throughput/total_tokens=369,216,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1924/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=369,408,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1925/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=369,600,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1926/500000] + train/ActionNoiseL2Loss=0.1789 + throughput/total_tokens=369,792,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1927/500000] + train/ActionNoiseL2Loss=0.1694 + throughput/total_tokens=369,984,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1928/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=370,176,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1929/500000] + train/ActionNoiseL2Loss=0.1743 + throughput/total_tokens=370,368,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1930/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=370,560,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1931/500000] + train/ActionNoiseL2Loss=0.1447 + throughput/total_tokens=370,752,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1932/500000] + train/ActionNoiseL2Loss=0.1491 + throughput/total_tokens=370,944,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1933/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=371,136,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1934/500000] + train/ActionNoiseL2Loss=0.1134 + throughput/total_tokens=371,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1935/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=371,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1936/500000] + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=371,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1937/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=371,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1938/500000] + train/ActionNoiseL2Loss=0.1646 + throughput/total_tokens=372,096,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1939/500000] + train/ActionNoiseL2Loss=0.1564 + throughput/total_tokens=372,288,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1940/500000] + optim/total_grad_norm=3.090 + train/ActionNoiseL2Loss=0.1506 + throughput/total_tokens=372,480,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1941/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=372,672,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1942/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=372,864,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1943/500000] + train/ActionNoiseL2Loss=0.1153 + throughput/total_tokens=373,056,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1944/500000] + train/ActionNoiseL2Loss=0.1683 + throughput/total_tokens=373,248,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1945/500000] + train/ActionNoiseL2Loss=0.1647 + throughput/total_tokens=373,440,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1946/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=373,632,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1947/500000] + train/ActionNoiseL2Loss=0.1318 + throughput/total_tokens=373,824,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1948/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=374,016,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1949/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=374,208,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=1950/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=374,400,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=1951/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=374,592,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1952/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=374,784,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1953/500000] + train/ActionNoiseL2Loss=0.1325 + throughput/total_tokens=374,976,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1954/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=375,168,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1955/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=375,360,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1956/500000] + train/ActionNoiseL2Loss=0.1058 + throughput/total_tokens=375,552,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1957/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=375,744,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1958/500000] + train/ActionNoiseL2Loss=0.1389 + throughput/total_tokens=375,936,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1959/500000] + train/ActionNoiseL2Loss=0.1786 + throughput/total_tokens=376,128,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1960/500000] + optim/total_grad_norm=3.030 + train/ActionNoiseL2Loss=0.1322 + throughput/total_tokens=376,320,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=1961/500000] + train/ActionNoiseL2Loss=0.1293 + throughput/total_tokens=376,512,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1962/500000] + train/ActionNoiseL2Loss=0.1277 + throughput/total_tokens=376,704,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1963/500000] + train/ActionNoiseL2Loss=0.1400 + throughput/total_tokens=376,896,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1964/500000] + train/ActionNoiseL2Loss=0.1368 + throughput/total_tokens=377,088,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1965/500000] + train/ActionNoiseL2Loss=0.1214 + throughput/total_tokens=377,280,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=1966/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=377,472,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=1967/500000] + train/ActionNoiseL2Loss=0.1111 + throughput/total_tokens=377,664,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1968/500000] + train/ActionNoiseL2Loss=0.1140 + throughput/total_tokens=377,856,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1969/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=378,048,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1970/500000] + train/ActionNoiseL2Loss=0.1652 + throughput/total_tokens=378,240,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=1971/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=378,432,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1972/500000] + train/ActionNoiseL2Loss=0.1995 + throughput/total_tokens=378,624,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1973/500000] + train/ActionNoiseL2Loss=0.1127 + throughput/total_tokens=378,816,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1974/500000] + train/ActionNoiseL2Loss=0.1974 + throughput/total_tokens=379,008,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1975/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=379,200,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1976/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=379,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1977/500000] + train/ActionNoiseL2Loss=0.2004 + throughput/total_tokens=379,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1978/500000] + train/ActionNoiseL2Loss=0.1556 + throughput/total_tokens=379,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1979/500000] + train/ActionNoiseL2Loss=0.1542 + throughput/total_tokens=379,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1980/500000] + optim/total_grad_norm=3.497 + train/ActionNoiseL2Loss=0.1271 + throughput/total_tokens=380,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=1981/500000] + train/ActionNoiseL2Loss=0.1494 + throughput/total_tokens=380,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1982/500000] + train/ActionNoiseL2Loss=0.1642 + throughput/total_tokens=380,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1983/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=380,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1984/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=380,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1985/500000] + train/ActionNoiseL2Loss=0.1188 + throughput/total_tokens=381,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=1986/500000] + train/ActionNoiseL2Loss=0.2034 + throughput/total_tokens=381,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=1987/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=381,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=1988/500000] + train/ActionNoiseL2Loss=0.2124 + throughput/total_tokens=381,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1989/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=381,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1990/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=382,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=1991/500000] + train/ActionNoiseL2Loss=0.1488 + throughput/total_tokens=382,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1992/500000] + train/ActionNoiseL2Loss=0.1555 + throughput/total_tokens=382,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1993/500000] + train/ActionNoiseL2Loss=0.1371 + throughput/total_tokens=382,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=1994/500000] + train/ActionNoiseL2Loss=0.1935 + throughput/total_tokens=382,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1995/500000] + train/ActionNoiseL2Loss=0.1941 + throughput/total_tokens=383,040,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1996/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=383,232,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1997/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=383,424,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1998/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=383,616,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=1999/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=383,808,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2000/500000] + optim/total_grad_norm=2.394 + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=384,000,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +10/06 [04:31:17] INFO | >> Saving config... checkpoint.py:608 +10/06 [04:31:59] INFO | >> Saving model state... checkpoint.py:796 +10/06 [04:33:06] INFO | >> Saving optim state... checkpoint.py:811 +10/06 [04:34:37] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=2001/500000] + train/ActionNoiseL2Loss=0.1388 + throughput/total_tokens=384,192,000 + throughput/device/tokens_per_second=1,195 + throughput/device/batches_per_second=0.0498 +[step=2002/500000] + train/ActionNoiseL2Loss=0.1943 + throughput/total_tokens=384,384,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=2003/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=384,576,000 + throughput/device/tokens_per_second=1,165 + throughput/device/batches_per_second=0.0486 +[step=2004/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=384,768,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0485 +[step=2005/500000] + train/ActionNoiseL2Loss=0.2068 + throughput/total_tokens=384,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=2006/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=385,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=2007/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=385,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=2008/500000] + train/ActionNoiseL2Loss=0.1068 + throughput/total_tokens=385,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2009/500000] + train/ActionNoiseL2Loss=0.1374 + throughput/total_tokens=385,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2010/500000] + train/ActionNoiseL2Loss=0.1627 + throughput/total_tokens=385,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=2011/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=386,112,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2012/500000] + train/ActionNoiseL2Loss=0.2382 + throughput/total_tokens=386,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2013/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=386,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2014/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=386,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2015/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=386,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2016/500000] + train/ActionNoiseL2Loss=0.1119 + throughput/total_tokens=387,072,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2017/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=387,264,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2018/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=387,456,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2019/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=387,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2020/500000] + optim/total_grad_norm=3.332 + train/ActionNoiseL2Loss=0.1333 + throughput/total_tokens=387,840,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2021/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=388,032,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2022/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=388,224,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2023/500000] + train/ActionNoiseL2Loss=0.1461 + throughput/total_tokens=388,416,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2024/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=388,608,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2025/500000] + train/ActionNoiseL2Loss=0.1802 + throughput/total_tokens=388,800,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2026/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=388,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2027/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=389,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2028/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=389,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2029/500000] + train/ActionNoiseL2Loss=0.1606 + throughput/total_tokens=389,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2030/500000] + train/ActionNoiseL2Loss=0.1517 + throughput/total_tokens=389,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2031/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=389,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2032/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=390,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2033/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=390,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2034/500000] + train/ActionNoiseL2Loss=0.1787 + throughput/total_tokens=390,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2035/500000] + train/ActionNoiseL2Loss=0.1352 + throughput/total_tokens=390,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2036/500000] + train/ActionNoiseL2Loss=0.1688 + throughput/total_tokens=390,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2037/500000] + train/ActionNoiseL2Loss=0.1103 + throughput/total_tokens=391,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2038/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=391,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2039/500000] + train/ActionNoiseL2Loss=0.1678 + throughput/total_tokens=391,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2040/500000] + optim/total_grad_norm=4.160 + train/ActionNoiseL2Loss=0.1970 + throughput/total_tokens=391,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2041/500000] + train/ActionNoiseL2Loss=0.1369 + throughput/total_tokens=391,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2042/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=392,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2043/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=392,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2044/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=392,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2045/500000] + train/ActionNoiseL2Loss=0.1115 + throughput/total_tokens=392,640,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2046/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=392,832,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2047/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=393,024,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2048/500000] + train/ActionNoiseL2Loss=0.1124 + throughput/total_tokens=393,216,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2049/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=393,408,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2050/500000] + train/ActionNoiseL2Loss=0.1533 + throughput/total_tokens=393,600,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2051/500000] + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=393,792,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2052/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=393,984,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2053/500000] + train/ActionNoiseL2Loss=0.1531 + throughput/total_tokens=394,176,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2054/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=394,368,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2055/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=394,560,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2056/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=394,752,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2057/500000] + train/ActionNoiseL2Loss=0.1990 + throughput/total_tokens=394,944,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2058/500000] + train/ActionNoiseL2Loss=0.1626 + throughput/total_tokens=395,136,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2059/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=395,328,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2060/500000] + optim/total_grad_norm=3.452 + train/ActionNoiseL2Loss=0.1572 + throughput/total_tokens=395,520,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2061/500000] + train/ActionNoiseL2Loss=0.0968 + throughput/total_tokens=395,712,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2062/500000] + train/ActionNoiseL2Loss=0.1112 + throughput/total_tokens=395,904,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2063/500000] + train/ActionNoiseL2Loss=0.1276 + throughput/total_tokens=396,096,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2064/500000] + train/ActionNoiseL2Loss=0.2292 + throughput/total_tokens=396,288,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2065/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=396,480,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2066/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=396,672,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2067/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=396,864,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2068/500000] + train/ActionNoiseL2Loss=0.1571 + throughput/total_tokens=397,056,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2069/500000] + train/ActionNoiseL2Loss=0.1473 + throughput/total_tokens=397,248,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2070/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=397,440,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2071/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=397,632,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2072/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=397,824,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2073/500000] + train/ActionNoiseL2Loss=0.1733 + throughput/total_tokens=398,016,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2074/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=398,208,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2075/500000] + train/ActionNoiseL2Loss=0.1307 + throughput/total_tokens=398,400,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2076/500000] + train/ActionNoiseL2Loss=0.1278 + throughput/total_tokens=398,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2077/500000] + train/ActionNoiseL2Loss=0.1409 + throughput/total_tokens=398,784,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2078/500000] + train/ActionNoiseL2Loss=0.1228 + throughput/total_tokens=398,976,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2079/500000] + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=399,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2080/500000] + optim/total_grad_norm=2.135 + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=399,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2081/500000] + train/ActionNoiseL2Loss=0.1585 + throughput/total_tokens=399,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2082/500000] + train/ActionNoiseL2Loss=0.1894 + throughput/total_tokens=399,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2083/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=399,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2084/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=400,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2085/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=400,320,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2086/500000] + train/ActionNoiseL2Loss=0.1301 + throughput/total_tokens=400,512,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2087/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=400,704,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2088/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=400,896,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2089/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=401,088,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2090/500000] + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=401,280,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2091/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=401,472,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2092/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=401,664,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2093/500000] + train/ActionNoiseL2Loss=0.1282 + throughput/total_tokens=401,856,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2094/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=402,048,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2095/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=402,240,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2096/500000] + train/ActionNoiseL2Loss=0.1378 + throughput/total_tokens=402,432,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2097/500000] + train/ActionNoiseL2Loss=0.1136 + throughput/total_tokens=402,624,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2098/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=402,816,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2099/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=403,008,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2100/500000] + optim/total_grad_norm=2.411 + train/ActionNoiseL2Loss=0.1007 + throughput/total_tokens=403,200,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2101/500000] + train/ActionNoiseL2Loss=0.1786 + throughput/total_tokens=403,392,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2102/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=403,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2103/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=403,776,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2104/500000] + train/ActionNoiseL2Loss=0.1207 + throughput/total_tokens=403,968,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2105/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=404,160,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2106/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=404,352,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2107/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=404,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2108/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=404,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2109/500000] + train/ActionNoiseL2Loss=0.1155 + throughput/total_tokens=404,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2110/500000] + train/ActionNoiseL2Loss=0.1469 + throughput/total_tokens=405,120,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2111/500000] + train/ActionNoiseL2Loss=0.1114 + throughput/total_tokens=405,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2112/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=405,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2113/500000] + train/ActionNoiseL2Loss=0.1540 + throughput/total_tokens=405,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2114/500000] + train/ActionNoiseL2Loss=0.1466 + throughput/total_tokens=405,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2115/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=406,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2116/500000] + train/ActionNoiseL2Loss=0.1559 + throughput/total_tokens=406,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2117/500000] + train/ActionNoiseL2Loss=0.1540 + throughput/total_tokens=406,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2118/500000] + train/ActionNoiseL2Loss=0.1641 + throughput/total_tokens=406,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2119/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=406,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2120/500000] + optim/total_grad_norm=2.353 + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=407,040,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2121/500000] + train/ActionNoiseL2Loss=0.1012 + throughput/total_tokens=407,232,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2122/500000] + train/ActionNoiseL2Loss=0.1493 + throughput/total_tokens=407,424,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2123/500000] + train/ActionNoiseL2Loss=0.1331 + throughput/total_tokens=407,616,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2124/500000] + train/ActionNoiseL2Loss=0.1459 + throughput/total_tokens=407,808,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2125/500000] + train/ActionNoiseL2Loss=0.1253 + throughput/total_tokens=408,000,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2126/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=408,192,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2127/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=408,384,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2128/500000] + train/ActionNoiseL2Loss=0.1557 + throughput/total_tokens=408,576,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2129/500000] + train/ActionNoiseL2Loss=0.1778 + throughput/total_tokens=408,768,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2130/500000] + train/ActionNoiseL2Loss=0.1371 + throughput/total_tokens=408,960,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2131/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=409,152,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2132/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=409,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2133/500000] + train/ActionNoiseL2Loss=0.1267 + throughput/total_tokens=409,536,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2134/500000] + train/ActionNoiseL2Loss=0.1800 + throughput/total_tokens=409,728,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2135/500000] + train/ActionNoiseL2Loss=0.1554 + throughput/total_tokens=409,920,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2136/500000] + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=410,112,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2137/500000] + train/ActionNoiseL2Loss=0.1841 + throughput/total_tokens=410,304,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2138/500000] + train/ActionNoiseL2Loss=0.1521 + throughput/total_tokens=410,496,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2139/500000] + train/ActionNoiseL2Loss=0.1094 + throughput/total_tokens=410,688,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2140/500000] + optim/total_grad_norm=2.553 + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=410,880,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2141/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=411,072,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2142/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=411,264,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2143/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=411,456,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2144/500000] + train/ActionNoiseL2Loss=0.1442 + throughput/total_tokens=411,648,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2145/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=411,840,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2146/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=412,032,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2147/500000] + train/ActionNoiseL2Loss=0.1175 + throughput/total_tokens=412,224,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2148/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=412,416,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2149/500000] + train/ActionNoiseL2Loss=0.1300 + throughput/total_tokens=412,608,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2150/500000] + train/ActionNoiseL2Loss=0.2609 + throughput/total_tokens=412,800,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2151/500000] + train/ActionNoiseL2Loss=0.1591 + throughput/total_tokens=412,992,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2152/500000] + train/ActionNoiseL2Loss=0.1527 + throughput/total_tokens=413,184,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2153/500000] + train/ActionNoiseL2Loss=0.1308 + throughput/total_tokens=413,376,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2154/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=413,568,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2155/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=413,760,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2156/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=413,952,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2157/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=414,144,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2158/500000] + train/ActionNoiseL2Loss=0.1256 + throughput/total_tokens=414,336,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2159/500000] + train/ActionNoiseL2Loss=0.1474 + throughput/total_tokens=414,528,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2160/500000] + optim/total_grad_norm=2.634 + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=414,720,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2161/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=414,912,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2162/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=415,104,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2163/500000] + train/ActionNoiseL2Loss=0.1249 + throughput/total_tokens=415,296,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2164/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=415,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2165/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=415,680,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2166/500000] + train/ActionNoiseL2Loss=0.1524 + throughput/total_tokens=415,872,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2167/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=416,064,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2168/500000] + train/ActionNoiseL2Loss=0.1220 + throughput/total_tokens=416,256,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2169/500000] + train/ActionNoiseL2Loss=0.1485 + throughput/total_tokens=416,448,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2170/500000] + train/ActionNoiseL2Loss=0.1172 + throughput/total_tokens=416,640,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2171/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=416,832,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2172/500000] + train/ActionNoiseL2Loss=0.1769 + throughput/total_tokens=417,024,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2173/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=417,216,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2174/500000] + train/ActionNoiseL2Loss=0.1474 + throughput/total_tokens=417,408,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2175/500000] + train/ActionNoiseL2Loss=0.1725 + throughput/total_tokens=417,600,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2176/500000] + train/ActionNoiseL2Loss=0.1316 + throughput/total_tokens=417,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2177/500000] + train/ActionNoiseL2Loss=0.2520 + throughput/total_tokens=417,984,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2178/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=418,176,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2179/500000] + train/ActionNoiseL2Loss=0.2351 + throughput/total_tokens=418,368,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2180/500000] + optim/total_grad_norm=2.868 + train/ActionNoiseL2Loss=0.1289 + throughput/total_tokens=418,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2181/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=418,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2182/500000] + train/ActionNoiseL2Loss=0.1121 + throughput/total_tokens=418,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2183/500000] + train/ActionNoiseL2Loss=0.1102 + throughput/total_tokens=419,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2184/500000] + train/ActionNoiseL2Loss=0.1605 + throughput/total_tokens=419,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2185/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=419,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2186/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=419,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2187/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=419,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2188/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=420,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2189/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=420,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2190/500000] + train/ActionNoiseL2Loss=0.1491 + throughput/total_tokens=420,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2191/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=420,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2192/500000] + train/ActionNoiseL2Loss=0.1476 + throughput/total_tokens=420,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2193/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=421,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2194/500000] + train/ActionNoiseL2Loss=0.1822 + throughput/total_tokens=421,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2195/500000] + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=421,440,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2196/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=421,632,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2197/500000] + train/ActionNoiseL2Loss=0.1417 + throughput/total_tokens=421,824,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2198/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=422,016,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2199/500000] + train/ActionNoiseL2Loss=0.1481 + throughput/total_tokens=422,208,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2200/500000] + optim/total_grad_norm=2.896 + train/ActionNoiseL2Loss=0.1318 + throughput/total_tokens=422,400,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2201/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=422,592,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2202/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=422,784,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2203/500000] + train/ActionNoiseL2Loss=0.1144 + throughput/total_tokens=422,976,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2204/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=423,168,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2205/500000] + train/ActionNoiseL2Loss=0.1662 + throughput/total_tokens=423,360,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2206/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=423,552,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2207/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=423,744,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2208/500000] + train/ActionNoiseL2Loss=0.1479 + throughput/total_tokens=423,936,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2209/500000] + train/ActionNoiseL2Loss=0.1420 + throughput/total_tokens=424,128,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2210/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=424,320,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2211/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=424,512,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2212/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=424,704,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2213/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=424,896,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2214/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=425,088,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2215/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=425,280,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2216/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=425,472,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2217/500000] + train/ActionNoiseL2Loss=0.1578 + throughput/total_tokens=425,664,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2218/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=425,856,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2219/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=426,048,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2220/500000] + optim/total_grad_norm=3.201 + train/ActionNoiseL2Loss=0.1348 + throughput/total_tokens=426,240,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2221/500000] + train/ActionNoiseL2Loss=0.1600 + throughput/total_tokens=426,432,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2222/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=426,624,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2223/500000] + train/ActionNoiseL2Loss=0.1778 + throughput/total_tokens=426,816,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2224/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=427,008,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2225/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=427,200,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2226/500000] + train/ActionNoiseL2Loss=0.1527 + throughput/total_tokens=427,392,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2227/500000] + train/ActionNoiseL2Loss=0.1331 + throughput/total_tokens=427,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2228/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=427,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2229/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=427,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2230/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=428,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2231/500000] + train/ActionNoiseL2Loss=0.1368 + throughput/total_tokens=428,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2232/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=428,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2233/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=428,736,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2234/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=428,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2235/500000] + train/ActionNoiseL2Loss=0.1355 + throughput/total_tokens=429,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2236/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=429,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2237/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=429,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2238/500000] + train/ActionNoiseL2Loss=0.1201 + throughput/total_tokens=429,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2239/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=429,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2240/500000] + optim/total_grad_norm=2.665 + train/ActionNoiseL2Loss=0.1298 + throughput/total_tokens=430,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2241/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=430,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2242/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=430,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2243/500000] + train/ActionNoiseL2Loss=0.1193 + throughput/total_tokens=430,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2244/500000] + train/ActionNoiseL2Loss=0.1336 + throughput/total_tokens=430,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2245/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=431,040,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2246/500000] + train/ActionNoiseL2Loss=0.1271 + throughput/total_tokens=431,232,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2247/500000] + train/ActionNoiseL2Loss=0.1321 + throughput/total_tokens=431,424,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2248/500000] + train/ActionNoiseL2Loss=0.1402 + throughput/total_tokens=431,616,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2249/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=431,808,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2250/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=432,000,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2251/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=432,192,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2252/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=432,384,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2253/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=432,576,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2254/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=432,768,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2255/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=432,960,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2256/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=433,152,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2257/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=433,344,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2258/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=433,536,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2259/500000] + train/ActionNoiseL2Loss=0.1364 + throughput/total_tokens=433,728,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2260/500000] + optim/total_grad_norm=2.401 + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=433,920,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2261/500000] + train/ActionNoiseL2Loss=0.2111 + throughput/total_tokens=434,112,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2262/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=434,304,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2263/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=434,496,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2264/500000] + train/ActionNoiseL2Loss=0.1865 + throughput/total_tokens=434,688,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2265/500000] + train/ActionNoiseL2Loss=0.1178 + throughput/total_tokens=434,880,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2266/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=435,072,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2267/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=435,264,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2268/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=435,456,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2269/500000] + train/ActionNoiseL2Loss=0.1119 + throughput/total_tokens=435,648,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2270/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=435,840,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2271/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=436,032,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2272/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=436,224,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2273/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=436,416,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2274/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=436,608,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2275/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=436,800,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2276/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=436,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2277/500000] + train/ActionNoiseL2Loss=0.1267 + throughput/total_tokens=437,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2278/500000] + train/ActionNoiseL2Loss=0.1337 + throughput/total_tokens=437,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2279/500000] + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=437,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2280/500000] + optim/total_grad_norm=3.002 + train/ActionNoiseL2Loss=0.0979 + throughput/total_tokens=437,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2281/500000] + train/ActionNoiseL2Loss=0.1509 + throughput/total_tokens=437,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2282/500000] + train/ActionNoiseL2Loss=0.1096 + throughput/total_tokens=438,144,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2283/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=438,336,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2284/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=438,528,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2285/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=438,720,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2286/500000] + train/ActionNoiseL2Loss=0.1271 + throughput/total_tokens=438,912,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2287/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=439,104,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2288/500000] + train/ActionNoiseL2Loss=0.1149 + throughput/total_tokens=439,296,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2289/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=439,488,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2290/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=439,680,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2291/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=439,872,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2292/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=440,064,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2293/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=440,256,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2294/500000] + train/ActionNoiseL2Loss=0.2021 + throughput/total_tokens=440,448,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2295/500000] + train/ActionNoiseL2Loss=0.1444 + throughput/total_tokens=440,640,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2296/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=440,832,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2297/500000] + train/ActionNoiseL2Loss=0.1130 + throughput/total_tokens=441,024,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2298/500000] + train/ActionNoiseL2Loss=0.1754 + throughput/total_tokens=441,216,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2299/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=441,408,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2300/500000] + optim/total_grad_norm=2.822 + train/ActionNoiseL2Loss=0.1481 + throughput/total_tokens=441,600,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2301/500000] + train/ActionNoiseL2Loss=0.1172 + throughput/total_tokens=441,792,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2302/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=441,984,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2303/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=442,176,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2304/500000] + train/ActionNoiseL2Loss=0.1969 + throughput/total_tokens=442,368,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2305/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=442,560,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2306/500000] + train/ActionNoiseL2Loss=0.1319 + throughput/total_tokens=442,752,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2307/500000] + train/ActionNoiseL2Loss=0.1182 + throughput/total_tokens=442,944,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2308/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=443,136,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2309/500000] + train/ActionNoiseL2Loss=0.1583 + throughput/total_tokens=443,328,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2310/500000] + train/ActionNoiseL2Loss=0.1426 + throughput/total_tokens=443,520,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2311/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=443,712,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2312/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=443,904,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2313/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=444,096,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2314/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=444,288,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2315/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=444,480,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2316/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=444,672,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2317/500000] + train/ActionNoiseL2Loss=0.1070 + throughput/total_tokens=444,864,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2318/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=445,056,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2319/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=445,248,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2320/500000] + optim/total_grad_norm=2.065 + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=445,440,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2321/500000] + train/ActionNoiseL2Loss=0.1071 + throughput/total_tokens=445,632,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2322/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=445,824,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2323/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=446,016,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2324/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=446,208,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2325/500000] + train/ActionNoiseL2Loss=0.1406 + throughput/total_tokens=446,400,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2326/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=446,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2327/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=446,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2328/500000] + train/ActionNoiseL2Loss=0.1765 + throughput/total_tokens=446,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2329/500000] + train/ActionNoiseL2Loss=0.1142 + throughput/total_tokens=447,168,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2330/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=447,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2331/500000] + train/ActionNoiseL2Loss=0.1289 + throughput/total_tokens=447,552,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2332/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=447,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2333/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=447,936,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2334/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=448,128,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2335/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=448,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2336/500000] + train/ActionNoiseL2Loss=0.1438 + throughput/total_tokens=448,512,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2337/500000] + train/ActionNoiseL2Loss=0.1192 + throughput/total_tokens=448,704,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2338/500000] + train/ActionNoiseL2Loss=0.1206 + throughput/total_tokens=448,896,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2339/500000] + train/ActionNoiseL2Loss=0.1597 + throughput/total_tokens=449,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2340/500000] + optim/total_grad_norm=2.759 + train/ActionNoiseL2Loss=0.1068 + throughput/total_tokens=449,280,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2341/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=449,472,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2342/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=449,664,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2343/500000] + train/ActionNoiseL2Loss=0.1335 + throughput/total_tokens=449,856,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2344/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=450,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2345/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=450,240,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2346/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=450,432,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2347/500000] + train/ActionNoiseL2Loss=0.1404 + throughput/total_tokens=450,624,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2348/500000] + train/ActionNoiseL2Loss=0.1729 + throughput/total_tokens=450,816,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2349/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=451,008,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2350/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=451,200,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2351/500000] + train/ActionNoiseL2Loss=0.1839 + throughput/total_tokens=451,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2352/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=451,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2353/500000] + train/ActionNoiseL2Loss=0.0948 + throughput/total_tokens=451,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2354/500000] + train/ActionNoiseL2Loss=0.1367 + throughput/total_tokens=451,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2355/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=452,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2356/500000] + train/ActionNoiseL2Loss=0.1391 + throughput/total_tokens=452,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2357/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=452,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2358/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=452,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2359/500000] + train/ActionNoiseL2Loss=0.1059 + throughput/total_tokens=452,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2360/500000] + optim/total_grad_norm=2.635 + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=453,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=46,467 +[step=2361/500000] + train/ActionNoiseL2Loss=0.1423 + throughput/total_tokens=453,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2362/500000] + train/ActionNoiseL2Loss=0.1431 + throughput/total_tokens=453,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2363/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=453,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2364/500000] + train/ActionNoiseL2Loss=0.1335 + throughput/total_tokens=453,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2365/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=454,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2366/500000] + train/ActionNoiseL2Loss=0.1630 + throughput/total_tokens=454,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2367/500000] + train/ActionNoiseL2Loss=0.1194 + throughput/total_tokens=454,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2368/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=454,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2369/500000] + train/ActionNoiseL2Loss=0.1165 + throughput/total_tokens=454,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2370/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=455,040,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2371/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=455,232,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2372/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=455,424,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2373/500000] + train/ActionNoiseL2Loss=0.1072 + throughput/total_tokens=455,616,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2374/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=455,808,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2375/500000] + train/ActionNoiseL2Loss=0.1436 + throughput/total_tokens=456,000,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2376/500000] + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=456,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2377/500000] + train/ActionNoiseL2Loss=0.1498 + throughput/total_tokens=456,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2378/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=456,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2379/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=456,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2380/500000] + optim/total_grad_norm=2.253 + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=456,960,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2381/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=457,152,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2382/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=457,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2383/500000] + train/ActionNoiseL2Loss=0.1299 + throughput/total_tokens=457,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2384/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=457,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2385/500000] + train/ActionNoiseL2Loss=0.1705 + throughput/total_tokens=457,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2386/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=458,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2387/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=458,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2388/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=458,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2389/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=458,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2390/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=458,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2391/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=459,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2392/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=459,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2393/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=459,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2394/500000] + train/ActionNoiseL2Loss=0.1215 + throughput/total_tokens=459,648,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2395/500000] + train/ActionNoiseL2Loss=0.1127 + throughput/total_tokens=459,840,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2396/500000] + train/ActionNoiseL2Loss=0.1628 + throughput/total_tokens=460,032,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2397/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=460,224,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2398/500000] + train/ActionNoiseL2Loss=0.1389 + throughput/total_tokens=460,416,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2399/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=460,608,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2400/500000] + optim/total_grad_norm=2.662 + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=460,800,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2401/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=460,992,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2402/500000] + train/ActionNoiseL2Loss=0.1353 + throughput/total_tokens=461,184,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2403/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=461,376,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2404/500000] + train/ActionNoiseL2Loss=0.1538 + throughput/total_tokens=461,568,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2405/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=461,760,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2406/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=461,952,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2407/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=462,144,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2408/500000] + train/ActionNoiseL2Loss=0.1369 + throughput/total_tokens=462,336,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2409/500000] + train/ActionNoiseL2Loss=0.1154 + throughput/total_tokens=462,528,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2410/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=462,720,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2411/500000] + train/ActionNoiseL2Loss=0.1750 + throughput/total_tokens=462,912,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2412/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=463,104,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2413/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=463,296,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2414/500000] + train/ActionNoiseL2Loss=0.1360 + throughput/total_tokens=463,488,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2415/500000] + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=463,680,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2416/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=463,872,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2417/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=464,064,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2418/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=464,256,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2419/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=464,448,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2420/500000] + optim/total_grad_norm=2.591 + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=464,640,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2421/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=464,832,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2422/500000] + train/ActionNoiseL2Loss=0.1553 + throughput/total_tokens=465,024,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2423/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=465,216,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2424/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=465,408,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2425/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=465,600,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2426/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=465,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2427/500000] + train/ActionNoiseL2Loss=0.1235 + throughput/total_tokens=465,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2428/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=466,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2429/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=466,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2430/500000] + train/ActionNoiseL2Loss=0.1893 + throughput/total_tokens=466,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2431/500000] + train/ActionNoiseL2Loss=0.1230 + throughput/total_tokens=466,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2432/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=466,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2433/500000] + train/ActionNoiseL2Loss=0.1418 + throughput/total_tokens=467,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2434/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=467,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2435/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=467,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2436/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=467,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2437/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=467,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2438/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=468,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2439/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=468,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2440/500000] + optim/total_grad_norm=2.142 + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=468,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2441/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=468,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2442/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=468,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2443/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=469,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2444/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=469,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2445/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=469,440,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2446/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=469,632,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2447/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=469,824,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2448/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=470,016,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2449/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=470,208,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2450/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=470,400,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2451/500000] + train/ActionNoiseL2Loss=0.1116 + throughput/total_tokens=470,592,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2452/500000] + train/ActionNoiseL2Loss=0.1280 + throughput/total_tokens=470,784,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2453/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=470,976,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2454/500000] + train/ActionNoiseL2Loss=0.1474 + throughput/total_tokens=471,168,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2455/500000] + train/ActionNoiseL2Loss=0.1153 + throughput/total_tokens=471,360,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2456/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=471,552,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2457/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=471,744,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2458/500000] + train/ActionNoiseL2Loss=0.1221 + throughput/total_tokens=471,936,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2459/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=472,128,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2460/500000] + optim/total_grad_norm=2.171 + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=472,320,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2461/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=472,512,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2462/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=472,704,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2463/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=472,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2464/500000] + train/ActionNoiseL2Loss=0.1360 + throughput/total_tokens=473,088,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2465/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=473,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2466/500000] + train/ActionNoiseL2Loss=0.1707 + throughput/total_tokens=473,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2467/500000] + train/ActionNoiseL2Loss=0.1625 + throughput/total_tokens=473,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2468/500000] + train/ActionNoiseL2Loss=0.1124 + throughput/total_tokens=473,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2469/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=474,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2470/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=474,240,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2471/500000] + train/ActionNoiseL2Loss=0.1297 + throughput/total_tokens=474,432,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2472/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=474,624,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2473/500000] + train/ActionNoiseL2Loss=0.1022 + throughput/total_tokens=474,816,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2474/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=475,008,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2475/500000] + train/ActionNoiseL2Loss=0.1220 + throughput/total_tokens=475,200,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2476/500000] + train/ActionNoiseL2Loss=0.1301 + throughput/total_tokens=475,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2477/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=475,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2478/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=475,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2479/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=475,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2480/500000] + optim/total_grad_norm=1.691 + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=476,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2481/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=476,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2482/500000] + train/ActionNoiseL2Loss=0.1265 + throughput/total_tokens=476,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2483/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=476,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2484/500000] + train/ActionNoiseL2Loss=0.1425 + throughput/total_tokens=476,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2485/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=477,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2486/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=477,312,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2487/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=477,504,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2488/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=477,696,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2489/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=477,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2490/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=478,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2491/500000] + train/ActionNoiseL2Loss=0.1389 + throughput/total_tokens=478,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2492/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=478,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2493/500000] + train/ActionNoiseL2Loss=0.0968 + throughput/total_tokens=478,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2494/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=478,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2495/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=479,040,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2496/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=479,232,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2497/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=479,424,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2498/500000] + train/ActionNoiseL2Loss=0.1262 + throughput/total_tokens=479,616,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2499/500000] + train/ActionNoiseL2Loss=0.1260 + throughput/total_tokens=479,808,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2500/500000] + optim/total_grad_norm=2.869 + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=480,000,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +10/06 [07:29:46] INFO | >> Saving config... checkpoint.py:608 +10/06 [07:30:18] INFO | >> Saving model state... checkpoint.py:796 +10/06 [07:31:30] INFO | >> Saving optim state... checkpoint.py:811 +10/06 [07:33:00] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=2501/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=480,192,000 + throughput/device/tokens_per_second=1,188 + throughput/device/batches_per_second=0.0495 +[step=2502/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=480,384,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=2503/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=480,576,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=2504/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=480,768,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=2505/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=480,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=2506/500000] + train/ActionNoiseL2Loss=0.1178 + throughput/total_tokens=481,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=2507/500000] + train/ActionNoiseL2Loss=0.1125 + throughput/total_tokens=481,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=2508/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=481,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2509/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=481,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2510/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=481,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=2511/500000] + train/ActionNoiseL2Loss=0.1336 + throughput/total_tokens=482,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2512/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=482,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2513/500000] + train/ActionNoiseL2Loss=0.1356 + throughput/total_tokens=482,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2514/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=482,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2515/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=482,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2516/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=483,072,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2517/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=483,264,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2518/500000] + train/ActionNoiseL2Loss=0.0948 + throughput/total_tokens=483,456,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2519/500000] + train/ActionNoiseL2Loss=0.1084 + throughput/total_tokens=483,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2520/500000] + optim/total_grad_norm=2.641 + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=483,840,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2521/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=484,032,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2522/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=484,224,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2523/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=484,416,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2524/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=484,608,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2525/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=484,800,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2526/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=484,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2527/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=485,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2528/500000] + train/ActionNoiseL2Loss=0.1049 + throughput/total_tokens=485,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2529/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=485,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2530/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=485,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2531/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=485,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2532/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=486,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2533/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=486,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2534/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=486,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2535/500000] + train/ActionNoiseL2Loss=0.1053 + throughput/total_tokens=486,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2536/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=486,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2537/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=487,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2538/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=487,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2539/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=487,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2540/500000] + optim/total_grad_norm=2.002 + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=487,680,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2541/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=487,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2542/500000] + train/ActionNoiseL2Loss=0.1318 + throughput/total_tokens=488,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2543/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=488,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2544/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=488,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2545/500000] + train/ActionNoiseL2Loss=0.1579 + throughput/total_tokens=488,640,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2546/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=488,832,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2547/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=489,024,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2548/500000] + train/ActionNoiseL2Loss=0.1119 + throughput/total_tokens=489,216,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2549/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=489,408,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2550/500000] + train/ActionNoiseL2Loss=0.1170 + throughput/total_tokens=489,600,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2551/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=489,792,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2552/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=489,984,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2553/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=490,176,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2554/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=490,368,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2555/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=490,560,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2556/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=490,752,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2557/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=490,944,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2558/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=491,136,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2559/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=491,328,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2560/500000] + optim/total_grad_norm=2.477 + train/ActionNoiseL2Loss=0.1372 + throughput/total_tokens=491,520,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2561/500000] + train/ActionNoiseL2Loss=0.1696 + throughput/total_tokens=491,712,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2562/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=491,904,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2563/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=492,096,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2564/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=492,288,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2565/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=492,480,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2566/500000] + train/ActionNoiseL2Loss=0.1537 + throughput/total_tokens=492,672,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2567/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=492,864,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2568/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=493,056,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2569/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=493,248,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2570/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=493,440,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2571/500000] + train/ActionNoiseL2Loss=0.1064 + throughput/total_tokens=493,632,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2572/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=493,824,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2573/500000] + train/ActionNoiseL2Loss=0.1498 + throughput/total_tokens=494,016,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2574/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=494,208,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2575/500000] + train/ActionNoiseL2Loss=0.1251 + throughput/total_tokens=494,400,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2576/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=494,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2577/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=494,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2578/500000] + train/ActionNoiseL2Loss=0.1349 + throughput/total_tokens=494,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2579/500000] + train/ActionNoiseL2Loss=0.1219 + throughput/total_tokens=495,168,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2580/500000] + optim/total_grad_norm=2.430 + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=495,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2581/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=495,552,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2582/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=495,744,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2583/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=495,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2584/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=496,128,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2585/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=496,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2586/500000] + train/ActionNoiseL2Loss=0.1224 + throughput/total_tokens=496,512,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2587/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=496,704,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2588/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=496,896,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2589/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=497,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2590/500000] + train/ActionNoiseL2Loss=0.1336 + throughput/total_tokens=497,280,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2591/500000] + train/ActionNoiseL2Loss=0.1476 + throughput/total_tokens=497,472,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2592/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=497,664,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2593/500000] + train/ActionNoiseL2Loss=0.1420 + throughput/total_tokens=497,856,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2594/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=498,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2595/500000] + train/ActionNoiseL2Loss=0.1532 + throughput/total_tokens=498,240,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2596/500000] + train/ActionNoiseL2Loss=0.1222 + throughput/total_tokens=498,432,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2597/500000] + train/ActionNoiseL2Loss=0.1742 + throughput/total_tokens=498,624,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2598/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=498,816,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2599/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=499,008,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2600/500000] + optim/total_grad_norm=2.461 + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=499,200,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2601/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=499,392,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2602/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=499,584,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2603/500000] + train/ActionNoiseL2Loss=0.1328 + throughput/total_tokens=499,776,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2604/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=499,968,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2605/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=500,160,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2606/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=500,352,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2607/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=500,544,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2608/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=500,736,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2609/500000] + train/ActionNoiseL2Loss=0.1667 + throughput/total_tokens=500,928,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2610/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=501,120,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2611/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=501,312,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2612/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=501,504,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2613/500000] + train/ActionNoiseL2Loss=0.1466 + throughput/total_tokens=501,696,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2614/500000] + train/ActionNoiseL2Loss=0.1536 + throughput/total_tokens=501,888,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2615/500000] + train/ActionNoiseL2Loss=0.1539 + throughput/total_tokens=502,080,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2616/500000] + train/ActionNoiseL2Loss=0.1197 + throughput/total_tokens=502,272,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2617/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=502,464,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2618/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=502,656,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2619/500000] + train/ActionNoiseL2Loss=0.1228 + throughput/total_tokens=502,848,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2620/500000] + optim/total_grad_norm=2.042 + train/ActionNoiseL2Loss=0.1144 + throughput/total_tokens=503,040,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2621/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=503,232,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2622/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=503,424,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2623/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=503,616,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2624/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=503,808,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2625/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=504,000,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2626/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=504,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2627/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=504,384,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2628/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=504,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2629/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=504,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2630/500000] + train/ActionNoiseL2Loss=0.1306 + throughput/total_tokens=504,960,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2631/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=505,152,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2632/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=505,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2633/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=505,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2634/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=505,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2635/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=505,920,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2636/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=506,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2637/500000] + train/ActionNoiseL2Loss=0.1084 + throughput/total_tokens=506,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2638/500000] + train/ActionNoiseL2Loss=0.1329 + throughput/total_tokens=506,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2639/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=506,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2640/500000] + optim/total_grad_norm=1.773 + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=506,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2641/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=507,072,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2642/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=507,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2643/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=507,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2644/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=507,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2645/500000] + train/ActionNoiseL2Loss=0.1686 + throughput/total_tokens=507,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2646/500000] + train/ActionNoiseL2Loss=0.1534 + throughput/total_tokens=508,032,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2647/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=508,224,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2648/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=508,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2649/500000] + train/ActionNoiseL2Loss=0.1593 + throughput/total_tokens=508,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2650/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=508,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=2651/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=508,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2652/500000] + train/ActionNoiseL2Loss=0.0982 + throughput/total_tokens=509,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2653/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=509,376,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2654/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=509,568,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2655/500000] + train/ActionNoiseL2Loss=0.1197 + throughput/total_tokens=509,760,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2656/500000] + train/ActionNoiseL2Loss=0.1323 + throughput/total_tokens=509,952,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2657/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=510,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2658/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=510,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2659/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=510,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2660/500000] + optim/total_grad_norm=2.368 + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=510,720,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2661/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=510,912,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2662/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=511,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2663/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=511,296,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2664/500000] + train/ActionNoiseL2Loss=0.1459 + throughput/total_tokens=511,488,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2665/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=511,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2666/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=511,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2667/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=512,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2668/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=512,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2669/500000] + train/ActionNoiseL2Loss=0.1155 + throughput/total_tokens=512,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2670/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=512,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=2671/500000] + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=512,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2672/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=513,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2673/500000] + train/ActionNoiseL2Loss=0.1633 + throughput/total_tokens=513,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2674/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=513,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2675/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=513,600,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2676/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=513,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=2677/500000] + train/ActionNoiseL2Loss=0.1275 + throughput/total_tokens=513,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2678/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=514,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2679/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=514,368,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2680/500000] + optim/total_grad_norm=1.407 + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=514,560,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2681/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=514,752,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2682/500000] + train/ActionNoiseL2Loss=0.1072 + throughput/total_tokens=514,944,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2683/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=515,136,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2684/500000] + train/ActionNoiseL2Loss=0.1430 + throughput/total_tokens=515,328,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2685/500000] + train/ActionNoiseL2Loss=0.1608 + throughput/total_tokens=515,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2686/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=515,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2687/500000] + train/ActionNoiseL2Loss=0.1271 + throughput/total_tokens=515,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2688/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=516,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2689/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=516,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2690/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=516,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2691/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=516,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2692/500000] + train/ActionNoiseL2Loss=0.1167 + throughput/total_tokens=516,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2693/500000] + train/ActionNoiseL2Loss=0.1201 + throughput/total_tokens=517,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2694/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=517,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2695/500000] + train/ActionNoiseL2Loss=0.1193 + throughput/total_tokens=517,440,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2696/500000] + train/ActionNoiseL2Loss=0.1547 + throughput/total_tokens=517,632,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2697/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=517,824,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2698/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=518,016,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2699/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=518,208,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2700/500000] + optim/total_grad_norm=2.673 + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=518,400,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2701/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=518,592,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2702/500000] + train/ActionNoiseL2Loss=0.1024 + throughput/total_tokens=518,784,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2703/500000] + train/ActionNoiseL2Loss=0.1203 + throughput/total_tokens=518,976,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2704/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=519,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2705/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=519,360,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2706/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=519,552,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2707/500000] + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=519,744,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2708/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=519,936,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2709/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=520,128,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2710/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=520,320,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2711/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=520,512,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2712/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=520,704,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2713/500000] + train/ActionNoiseL2Loss=0.1995 + throughput/total_tokens=520,896,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2714/500000] + train/ActionNoiseL2Loss=0.1613 + throughput/total_tokens=521,088,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2715/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=521,280,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2716/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=521,472,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2717/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=521,664,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2718/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=521,856,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2719/500000] + train/ActionNoiseL2Loss=0.1106 + throughput/total_tokens=522,048,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2720/500000] + optim/total_grad_norm=2.744 + train/ActionNoiseL2Loss=0.1116 + throughput/total_tokens=522,240,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2721/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=522,432,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2722/500000] + train/ActionNoiseL2Loss=0.1112 + throughput/total_tokens=522,624,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2723/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=522,816,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2724/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=523,008,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2725/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=523,200,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2726/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=523,392,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2727/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=523,584,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2728/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=523,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2729/500000] + train/ActionNoiseL2Loss=0.1193 + throughput/total_tokens=523,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2730/500000] + train/ActionNoiseL2Loss=0.1334 + throughput/total_tokens=524,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2731/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=524,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2732/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=524,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2733/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=524,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2734/500000] + train/ActionNoiseL2Loss=0.1226 + throughput/total_tokens=524,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2735/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=525,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2736/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=525,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2737/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=525,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2738/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=525,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2739/500000] + train/ActionNoiseL2Loss=0.1315 + throughput/total_tokens=525,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2740/500000] + optim/total_grad_norm=1.728 + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=526,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2741/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=526,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2742/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=526,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2743/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=526,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2744/500000] + train/ActionNoiseL2Loss=0.1733 + throughput/total_tokens=526,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2745/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=527,040,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2746/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=527,232,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2747/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=527,424,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2748/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=527,616,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2749/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=527,808,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2750/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=528,000,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2751/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=528,192,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2752/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=528,384,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2753/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=528,576,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2754/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=528,768,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2755/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=528,960,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2756/500000] + train/ActionNoiseL2Loss=0.1090 + throughput/total_tokens=529,152,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2757/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=529,344,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2758/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=529,536,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2759/500000] + train/ActionNoiseL2Loss=0.1269 + throughput/total_tokens=529,728,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2760/500000] + optim/total_grad_norm=3.842 + train/ActionNoiseL2Loss=0.1561 + throughput/total_tokens=529,920,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2761/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=530,112,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2762/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=530,304,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2763/500000] + train/ActionNoiseL2Loss=0.2154 + throughput/total_tokens=530,496,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2764/500000] + train/ActionNoiseL2Loss=0.1217 + throughput/total_tokens=530,688,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2765/500000] + train/ActionNoiseL2Loss=0.1149 + throughput/total_tokens=530,880,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2766/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=531,072,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2767/500000] + train/ActionNoiseL2Loss=0.1170 + throughput/total_tokens=531,264,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2768/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=531,456,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2769/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=531,648,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2770/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=531,840,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2771/500000] + train/ActionNoiseL2Loss=0.1099 + throughput/total_tokens=532,032,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2772/500000] + train/ActionNoiseL2Loss=0.1319 + throughput/total_tokens=532,224,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2773/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=532,416,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2774/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=532,608,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2775/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=532,800,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2776/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=532,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2777/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=533,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2778/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=533,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2779/500000] + train/ActionNoiseL2Loss=0.1102 + throughput/total_tokens=533,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2780/500000] + optim/total_grad_norm=1.904 + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=533,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2781/500000] + train/ActionNoiseL2Loss=0.1176 + throughput/total_tokens=533,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2782/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=534,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2783/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=534,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2784/500000] + train/ActionNoiseL2Loss=0.1294 + throughput/total_tokens=534,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2785/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=534,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2786/500000] + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=534,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2787/500000] + train/ActionNoiseL2Loss=0.1211 + throughput/total_tokens=535,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2788/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=535,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2789/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=535,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2790/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=535,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2791/500000] + train/ActionNoiseL2Loss=0.1361 + throughput/total_tokens=535,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2792/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=536,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2793/500000] + train/ActionNoiseL2Loss=0.1084 + throughput/total_tokens=536,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2794/500000] + train/ActionNoiseL2Loss=0.1203 + throughput/total_tokens=536,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2795/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=536,640,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2796/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=536,832,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2797/500000] + train/ActionNoiseL2Loss=0.1127 + throughput/total_tokens=537,024,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2798/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=537,216,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2799/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=537,408,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2800/500000] + optim/total_grad_norm=1.845 + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=537,600,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2801/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=537,792,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2802/500000] + train/ActionNoiseL2Loss=0.1022 + throughput/total_tokens=537,984,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2803/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=538,176,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2804/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=538,368,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2805/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=538,560,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2806/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=538,752,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2807/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=538,944,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2808/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=539,136,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2809/500000] + train/ActionNoiseL2Loss=0.1257 + throughput/total_tokens=539,328,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2810/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=539,520,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2811/500000] + train/ActionNoiseL2Loss=0.1313 + throughput/total_tokens=539,712,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2812/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=539,904,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2813/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=540,096,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2814/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=540,288,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2815/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=540,480,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2816/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=540,672,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2817/500000] + train/ActionNoiseL2Loss=0.1160 + throughput/total_tokens=540,864,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2818/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=541,056,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2819/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=541,248,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2820/500000] + optim/total_grad_norm=1.511 + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=541,440,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2821/500000] + train/ActionNoiseL2Loss=0.1135 + throughput/total_tokens=541,632,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2822/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=541,824,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2823/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=542,016,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2824/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=542,208,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2825/500000] + train/ActionNoiseL2Loss=0.1838 + throughput/total_tokens=542,400,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2826/500000] + train/ActionNoiseL2Loss=0.1432 + throughput/total_tokens=542,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2827/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=542,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2828/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=542,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2829/500000] + train/ActionNoiseL2Loss=0.1331 + throughput/total_tokens=543,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2830/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=543,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2831/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=543,552,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2832/500000] + train/ActionNoiseL2Loss=0.1166 + throughput/total_tokens=543,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2833/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=543,936,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2834/500000] + train/ActionNoiseL2Loss=0.1429 + throughput/total_tokens=544,128,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2835/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=544,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2836/500000] + train/ActionNoiseL2Loss=0.1002 + throughput/total_tokens=544,512,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2837/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=544,704,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2838/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=544,896,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2839/500000] + train/ActionNoiseL2Loss=0.1603 + throughput/total_tokens=545,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2840/500000] + optim/total_grad_norm=2.411 + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=545,280,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2841/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=545,472,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2842/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=545,664,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2843/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=545,856,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2844/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=546,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2845/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=546,240,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2846/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=546,432,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2847/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=546,624,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2848/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=546,816,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2849/500000] + train/ActionNoiseL2Loss=0.1751 + throughput/total_tokens=547,008,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=2850/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=547,200,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2851/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=547,392,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2852/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=547,584,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2853/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=547,776,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2854/500000] + train/ActionNoiseL2Loss=0.1639 + throughput/total_tokens=547,968,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2855/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=548,160,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2856/500000] + train/ActionNoiseL2Loss=0.1639 + throughput/total_tokens=548,352,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2857/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=548,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2858/500000] + train/ActionNoiseL2Loss=0.1337 + throughput/total_tokens=548,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2859/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=548,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2860/500000] + optim/total_grad_norm=2.297 + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=549,120,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2861/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=549,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2862/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=549,504,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2863/500000] + train/ActionNoiseL2Loss=0.1322 + throughput/total_tokens=549,696,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2864/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=549,888,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2865/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=550,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2866/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=550,272,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2867/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=550,464,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2868/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=550,656,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2869/500000] + train/ActionNoiseL2Loss=0.1442 + throughput/total_tokens=550,848,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2870/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=551,040,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2871/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=551,232,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2872/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=551,424,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2873/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=551,616,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2874/500000] + train/ActionNoiseL2Loss=0.1195 + throughput/total_tokens=551,808,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2875/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=552,000,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2876/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=552,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2877/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=552,384,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2878/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=552,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2879/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=552,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2880/500000] + optim/total_grad_norm=1.422 + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=552,960,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2881/500000] + train/ActionNoiseL2Loss=0.1087 + throughput/total_tokens=553,152,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2882/500000] + train/ActionNoiseL2Loss=0.1311 + throughput/total_tokens=553,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2883/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=553,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2884/500000] + train/ActionNoiseL2Loss=0.1123 + throughput/total_tokens=553,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2885/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=553,920,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2886/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=554,112,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2887/500000] + train/ActionNoiseL2Loss=0.1434 + throughput/total_tokens=554,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2888/500000] + train/ActionNoiseL2Loss=0.1779 + throughput/total_tokens=554,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2889/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=554,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2890/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=554,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2891/500000] + train/ActionNoiseL2Loss=0.1141 + throughput/total_tokens=555,072,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2892/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=555,264,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2893/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=555,456,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2894/500000] + train/ActionNoiseL2Loss=0.1018 + throughput/total_tokens=555,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2895/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=555,840,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2896/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=556,032,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2897/500000] + train/ActionNoiseL2Loss=0.1188 + throughput/total_tokens=556,224,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2898/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=556,416,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2899/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=556,608,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2900/500000] + optim/total_grad_norm=1.974 + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=556,800,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2901/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=556,992,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2902/500000] + train/ActionNoiseL2Loss=0.1234 + throughput/total_tokens=557,184,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2903/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=557,376,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2904/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=557,568,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2905/500000] + train/ActionNoiseL2Loss=0.1632 + throughput/total_tokens=557,760,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2906/500000] + train/ActionNoiseL2Loss=0.1053 + throughput/total_tokens=557,952,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2907/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=558,144,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2908/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=558,336,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2909/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=558,528,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2910/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=558,720,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=2911/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=558,912,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2912/500000] + train/ActionNoiseL2Loss=0.1024 + throughput/total_tokens=559,104,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2913/500000] + train/ActionNoiseL2Loss=0.1503 + throughput/total_tokens=559,296,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2914/500000] + train/ActionNoiseL2Loss=0.1181 + throughput/total_tokens=559,488,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2915/500000] + train/ActionNoiseL2Loss=0.1579 + throughput/total_tokens=559,680,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2916/500000] + train/ActionNoiseL2Loss=0.1205 + throughput/total_tokens=559,872,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2917/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=560,064,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2918/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=560,256,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=2919/500000] + train/ActionNoiseL2Loss=0.1140 + throughput/total_tokens=560,448,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=2920/500000] + optim/total_grad_norm=1.630 + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=560,640,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2921/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=560,832,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2922/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=561,024,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2923/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=561,216,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2924/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=561,408,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2925/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=561,600,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2926/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=561,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2927/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=561,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2928/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=562,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2929/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=562,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2930/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=562,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2931/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=562,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2932/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=562,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2933/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=563,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2934/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=563,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2935/500000] + train/ActionNoiseL2Loss=0.1268 + throughput/total_tokens=563,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2936/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=563,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2937/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=563,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2938/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=564,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2939/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=564,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2940/500000] + optim/total_grad_norm=1.791 + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=564,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2941/500000] + train/ActionNoiseL2Loss=0.1462 + throughput/total_tokens=564,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2942/500000] + train/ActionNoiseL2Loss=0.1239 + throughput/total_tokens=564,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2943/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=565,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2944/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=565,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2945/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=565,440,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2946/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=565,632,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2947/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=565,824,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2948/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=566,016,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2949/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=566,208,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2950/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=566,400,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2951/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=566,592,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2952/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=566,784,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2953/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=566,976,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2954/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=567,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2955/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=567,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2956/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=567,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2957/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=567,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2958/500000] + train/ActionNoiseL2Loss=0.1129 + throughput/total_tokens=567,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2959/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=568,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2960/500000] + optim/total_grad_norm=2.304 + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=568,320,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=2961/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=568,512,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2962/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=568,704,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2963/500000] + train/ActionNoiseL2Loss=0.0948 + throughput/total_tokens=568,896,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2964/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=569,088,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2965/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=569,280,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2966/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=569,472,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2967/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=569,664,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2968/500000] + train/ActionNoiseL2Loss=0.1477 + throughput/total_tokens=569,856,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2969/500000] + train/ActionNoiseL2Loss=0.1215 + throughput/total_tokens=570,048,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=2970/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=570,240,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2971/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=570,432,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2972/500000] + train/ActionNoiseL2Loss=0.1210 + throughput/total_tokens=570,624,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2973/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=570,816,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2974/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=571,008,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2975/500000] + train/ActionNoiseL2Loss=0.1445 + throughput/total_tokens=571,200,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=2976/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=571,392,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2977/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=571,584,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2978/500000] + train/ActionNoiseL2Loss=0.1346 + throughput/total_tokens=571,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2979/500000] + train/ActionNoiseL2Loss=0.1457 + throughput/total_tokens=571,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2980/500000] + optim/total_grad_norm=2.319 + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=572,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2981/500000] + train/ActionNoiseL2Loss=0.1560 + throughput/total_tokens=572,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2982/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=572,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2983/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=572,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2984/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=572,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2985/500000] + train/ActionNoiseL2Loss=0.1425 + throughput/total_tokens=573,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2986/500000] + train/ActionNoiseL2Loss=0.1435 + throughput/total_tokens=573,312,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2987/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=573,504,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2988/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=573,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2989/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=573,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2990/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=574,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=2991/500000] + train/ActionNoiseL2Loss=0.1374 + throughput/total_tokens=574,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2992/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=574,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=2993/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=574,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2994/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=574,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2995/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=575,040,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2996/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=575,232,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2997/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=575,424,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2998/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=575,616,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=2999/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=575,808,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3000/500000] + optim/total_grad_norm=1.827 + train/ActionNoiseL2Loss=0.1012 + throughput/total_tokens=576,000,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +10/06 [10:27:43] INFO | >> Saving config... checkpoint.py:608 +10/06 [10:28:26] INFO | >> Saving model state... checkpoint.py:796 +10/06 [10:29:37] INFO | >> Saving optim state... checkpoint.py:811 +10/06 [10:31:02] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=3001/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=576,192,000 + throughput/device/tokens_per_second=1,191 + throughput/device/batches_per_second=0.0496 +[step=3002/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=576,384,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=3003/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=576,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3004/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=576,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3005/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=576,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3006/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=577,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3007/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=577,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3008/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=577,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3009/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=577,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3010/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=577,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3011/500000] + train/ActionNoiseL2Loss=0.1246 + throughput/total_tokens=578,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3012/500000] + train/ActionNoiseL2Loss=0.2527 + throughput/total_tokens=578,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3013/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=578,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3014/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=578,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3015/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=578,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3016/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=579,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3017/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=579,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3018/500000] + train/ActionNoiseL2Loss=0.1274 + throughput/total_tokens=579,456,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3019/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=579,648,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3020/500000] + optim/total_grad_norm=1.812 + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=579,840,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3021/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=580,032,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3022/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=580,224,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3023/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=580,416,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3024/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=580,608,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3025/500000] + train/ActionNoiseL2Loss=0.1263 + throughput/total_tokens=580,800,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3026/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=580,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3027/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=581,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3028/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=581,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3029/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=581,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3030/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=581,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3031/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=581,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3032/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=582,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3033/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=582,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3034/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=582,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3035/500000] + train/ActionNoiseL2Loss=0.1360 + throughput/total_tokens=582,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3036/500000] + train/ActionNoiseL2Loss=0.1316 + throughput/total_tokens=582,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3037/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=583,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3038/500000] + train/ActionNoiseL2Loss=0.1068 + throughput/total_tokens=583,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3039/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=583,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3040/500000] + optim/total_grad_norm=2.110 + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=583,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3041/500000] + train/ActionNoiseL2Loss=0.1096 + throughput/total_tokens=583,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3042/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=584,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3043/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=584,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3044/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=584,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3045/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=584,640,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3046/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=584,832,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3047/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=585,024,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3048/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=585,216,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3049/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=585,408,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3050/500000] + train/ActionNoiseL2Loss=0.1202 + throughput/total_tokens=585,600,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3051/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=585,792,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=3052/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=585,984,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3053/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=586,176,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3054/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=586,368,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3055/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=586,560,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3056/500000] + train/ActionNoiseL2Loss=0.0929 + throughput/total_tokens=586,752,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3057/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=586,944,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3058/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=587,136,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3059/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=587,328,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3060/500000] + optim/total_grad_norm=2.327 + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=587,520,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3061/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=587,712,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3062/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=587,904,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3063/500000] + train/ActionNoiseL2Loss=0.1584 + throughput/total_tokens=588,096,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3064/500000] + train/ActionNoiseL2Loss=0.1303 + throughput/total_tokens=588,288,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3065/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=588,480,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3066/500000] + train/ActionNoiseL2Loss=0.1223 + throughput/total_tokens=588,672,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3067/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=588,864,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3068/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=589,056,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3069/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=589,248,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3070/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=589,440,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3071/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=589,632,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3072/500000] + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=589,824,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3073/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=590,016,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3074/500000] + train/ActionNoiseL2Loss=0.1797 + throughput/total_tokens=590,208,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3075/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=590,400,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3076/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=590,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3077/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=590,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3078/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=590,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3079/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=591,168,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3080/500000] + optim/total_grad_norm=1.432 + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=591,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3081/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=591,552,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3082/500000] + train/ActionNoiseL2Loss=0.1150 + throughput/total_tokens=591,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3083/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=591,936,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3084/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=592,128,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3085/500000] + train/ActionNoiseL2Loss=0.1453 + throughput/total_tokens=592,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3086/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=592,512,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3087/500000] + train/ActionNoiseL2Loss=0.1215 + throughput/total_tokens=592,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3088/500000] + train/ActionNoiseL2Loss=0.1007 + throughput/total_tokens=592,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3089/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=593,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3090/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=593,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3091/500000] + train/ActionNoiseL2Loss=0.1268 + throughput/total_tokens=593,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3092/500000] + train/ActionNoiseL2Loss=0.1388 + throughput/total_tokens=593,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3093/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=593,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3094/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=594,048,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3095/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=594,240,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3096/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=594,432,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3097/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=594,624,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3098/500000] + train/ActionNoiseL2Loss=0.1055 + throughput/total_tokens=594,816,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3099/500000] + train/ActionNoiseL2Loss=0.1421 + throughput/total_tokens=595,008,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3100/500000] + optim/total_grad_norm=1.762 + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=595,200,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3101/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=595,392,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3102/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=595,584,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3103/500000] + train/ActionNoiseL2Loss=0.1444 + throughput/total_tokens=595,776,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3104/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=595,968,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3105/500000] + train/ActionNoiseL2Loss=0.1171 + throughput/total_tokens=596,160,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3106/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=596,352,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=3107/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=596,544,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3108/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=596,736,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3109/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=596,928,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=3110/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=597,120,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=3111/500000] + train/ActionNoiseL2Loss=0.1676 + throughput/total_tokens=597,312,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3112/500000] + train/ActionNoiseL2Loss=0.1102 + throughput/total_tokens=597,504,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3113/500000] + train/ActionNoiseL2Loss=0.1319 + throughput/total_tokens=597,696,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3114/500000] + train/ActionNoiseL2Loss=0.1316 + throughput/total_tokens=597,888,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3115/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=598,080,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3116/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=598,272,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3117/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=598,464,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3118/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=598,656,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3119/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=598,848,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3120/500000] + optim/total_grad_norm=1.793 + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=599,040,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3121/500000] + train/ActionNoiseL2Loss=0.1271 + throughput/total_tokens=599,232,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3122/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=599,424,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3123/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=599,616,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3124/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=599,808,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3125/500000] + train/ActionNoiseL2Loss=0.1125 + throughput/total_tokens=600,000,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3126/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=600,192,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3127/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=600,384,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3128/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=600,576,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3129/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=600,768,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3130/500000] + train/ActionNoiseL2Loss=0.1524 + throughput/total_tokens=600,960,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3131/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=601,152,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3132/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=601,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3133/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=601,536,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3134/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=601,728,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3135/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=601,920,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3136/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=602,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3137/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=602,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3138/500000] + train/ActionNoiseL2Loss=0.1160 + throughput/total_tokens=602,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3139/500000] + train/ActionNoiseL2Loss=0.1141 + throughput/total_tokens=602,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3140/500000] + optim/total_grad_norm=1.901 + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=602,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3141/500000] + train/ActionNoiseL2Loss=0.1667 + throughput/total_tokens=603,072,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3142/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=603,264,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3143/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=603,456,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3144/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=603,648,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3145/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=603,840,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3146/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=604,032,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3147/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=604,224,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3148/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=604,416,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3149/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=604,608,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3150/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=604,800,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3151/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=604,992,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=3152/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=605,184,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3153/500000] + train/ActionNoiseL2Loss=0.1682 + throughput/total_tokens=605,376,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3154/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=605,568,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3155/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=605,760,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3156/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=605,952,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3157/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=606,144,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3158/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=606,336,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3159/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=606,528,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3160/500000] + optim/total_grad_norm=1.669 + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=606,720,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3161/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=606,912,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3162/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=607,104,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3163/500000] + train/ActionNoiseL2Loss=0.1133 + throughput/total_tokens=607,296,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3164/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=607,488,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3165/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=607,680,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3166/500000] + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=607,872,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3167/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=608,064,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3168/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=608,256,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3169/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=608,448,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3170/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=608,640,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3171/500000] + train/ActionNoiseL2Loss=0.1295 + throughput/total_tokens=608,832,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3172/500000] + train/ActionNoiseL2Loss=0.1206 + throughput/total_tokens=609,024,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3173/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=609,216,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3174/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=609,408,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3175/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=609,600,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3176/500000] + train/ActionNoiseL2Loss=0.1187 + throughput/total_tokens=609,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3177/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=609,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3178/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=610,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3179/500000] + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=610,368,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3180/500000] + optim/total_grad_norm=1.675 + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=610,560,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3181/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=610,752,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3182/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=610,944,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3183/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=611,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3184/500000] + train/ActionNoiseL2Loss=0.1646 + throughput/total_tokens=611,328,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3185/500000] + train/ActionNoiseL2Loss=0.1130 + throughput/total_tokens=611,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3186/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=611,712,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3187/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=611,904,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3188/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=612,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3189/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=612,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3190/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=612,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3191/500000] + train/ActionNoiseL2Loss=0.1224 + throughput/total_tokens=612,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3192/500000] + train/ActionNoiseL2Loss=0.2077 + throughput/total_tokens=612,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3193/500000] + train/ActionNoiseL2Loss=0.1129 + throughput/total_tokens=613,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3194/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=613,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3195/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=613,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3196/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=613,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3197/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=613,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3198/500000] + train/ActionNoiseL2Loss=0.1286 + throughput/total_tokens=614,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3199/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=614,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3200/500000] + optim/total_grad_norm=1.829 + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=614,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3201/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=614,592,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3202/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=614,784,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3203/500000] + train/ActionNoiseL2Loss=0.1152 + throughput/total_tokens=614,976,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3204/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=615,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3205/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=615,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3206/500000] + train/ActionNoiseL2Loss=0.1195 + throughput/total_tokens=615,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3207/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=615,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3208/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=615,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3209/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=616,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3210/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=616,320,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3211/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=616,512,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3212/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=616,704,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3213/500000] + train/ActionNoiseL2Loss=0.1160 + throughput/total_tokens=616,896,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3214/500000] + train/ActionNoiseL2Loss=0.1610 + throughput/total_tokens=617,088,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3215/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=617,280,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3216/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=617,472,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3217/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=617,664,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3218/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=617,856,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3219/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=618,048,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3220/500000] + optim/total_grad_norm=1.855 + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=618,240,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3221/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=618,432,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3222/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=618,624,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3223/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=618,816,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3224/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=619,008,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3225/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=619,200,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3226/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=619,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3227/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=619,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3228/500000] + train/ActionNoiseL2Loss=0.1815 + throughput/total_tokens=619,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3229/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=619,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3230/500000] + train/ActionNoiseL2Loss=0.1323 + throughput/total_tokens=620,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3231/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=620,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3232/500000] + train/ActionNoiseL2Loss=0.1268 + throughput/total_tokens=620,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3233/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=620,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3234/500000] + train/ActionNoiseL2Loss=0.1374 + throughput/total_tokens=620,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3235/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=621,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3236/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=621,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3237/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=621,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3238/500000] + train/ActionNoiseL2Loss=0.1297 + throughput/total_tokens=621,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3239/500000] + train/ActionNoiseL2Loss=0.1079 + throughput/total_tokens=621,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3240/500000] + optim/total_grad_norm=2.664 + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=622,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3241/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=622,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3242/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=622,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3243/500000] + train/ActionNoiseL2Loss=0.1202 + throughput/total_tokens=622,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3244/500000] + train/ActionNoiseL2Loss=0.1058 + throughput/total_tokens=622,848,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3245/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=623,040,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3246/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=623,232,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3247/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=623,424,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3248/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=623,616,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3249/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=623,808,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3250/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=624,000,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3251/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=624,192,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3252/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=624,384,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3253/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=624,576,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3254/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=624,768,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3255/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=624,960,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3256/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=625,152,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3257/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=625,344,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3258/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=625,536,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3259/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=625,728,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3260/500000] + optim/total_grad_norm=1.640 + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=625,920,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3261/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=626,112,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3262/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=626,304,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3263/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=626,496,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3264/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=626,688,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3265/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=626,880,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3266/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=627,072,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3267/500000] + train/ActionNoiseL2Loss=0.1884 + throughput/total_tokens=627,264,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3268/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=627,456,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3269/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=627,648,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3270/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=627,840,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3271/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=628,032,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3272/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=628,224,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3273/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=628,416,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3274/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=628,608,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3275/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=628,800,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3276/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=628,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3277/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=629,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3278/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=629,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3279/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=629,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3280/500000] + optim/total_grad_norm=2.272 + train/ActionNoiseL2Loss=0.1433 + throughput/total_tokens=629,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3281/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=629,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3282/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=630,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3283/500000] + train/ActionNoiseL2Loss=0.1312 + throughput/total_tokens=630,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3284/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=630,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3285/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=630,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3286/500000] + train/ActionNoiseL2Loss=0.1668 + throughput/total_tokens=630,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3287/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=631,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3288/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=631,296,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3289/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=631,488,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3290/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=631,680,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3291/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=631,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3292/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=632,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3293/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=632,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3294/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=632,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3295/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=632,640,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3296/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=632,832,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3297/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=633,024,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3298/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=633,216,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3299/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=633,408,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3300/500000] + optim/total_grad_norm=1.703 + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=633,600,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3301/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=633,792,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3302/500000] + train/ActionNoiseL2Loss=0.1187 + throughput/total_tokens=633,984,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3303/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=634,176,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3304/500000] + train/ActionNoiseL2Loss=0.1773 + throughput/total_tokens=634,368,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3305/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=634,560,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3306/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=634,752,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3307/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=634,944,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3308/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=635,136,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3309/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=635,328,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3310/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=635,520,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3311/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=635,712,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3312/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=635,904,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3313/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=636,096,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3314/500000] + train/ActionNoiseL2Loss=0.1198 + throughput/total_tokens=636,288,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3315/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=636,480,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=3316/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=636,672,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=3317/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=636,864,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=3318/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=637,056,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3319/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=637,248,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3320/500000] + optim/total_grad_norm=1.998 + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=637,440,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3321/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=637,632,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3322/500000] + train/ActionNoiseL2Loss=0.1276 + throughput/total_tokens=637,824,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3323/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=638,016,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3324/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=638,208,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3325/500000] + train/ActionNoiseL2Loss=0.1438 + throughput/total_tokens=638,400,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3326/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=638,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3327/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=638,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3328/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=638,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3329/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=639,168,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3330/500000] + train/ActionNoiseL2Loss=0.1461 + throughput/total_tokens=639,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3331/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=639,552,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3332/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=639,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3333/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=639,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3334/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=640,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3335/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=640,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3336/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=640,512,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3337/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=640,704,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3338/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=640,896,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3339/500000] + train/ActionNoiseL2Loss=0.1101 + throughput/total_tokens=641,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3340/500000] + optim/total_grad_norm=2.297 + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=641,280,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3341/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=641,472,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3342/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=641,664,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3343/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=641,856,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3344/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=642,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3345/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=642,240,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3346/500000] + train/ActionNoiseL2Loss=0.1929 + throughput/total_tokens=642,432,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3347/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=642,624,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3348/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=642,816,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3349/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=643,008,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3350/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=643,200,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3351/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=643,392,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3352/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=643,584,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3353/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=643,776,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3354/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=643,968,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3355/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=644,160,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3356/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=644,352,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3357/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=644,544,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3358/500000] + train/ActionNoiseL2Loss=0.1993 + throughput/total_tokens=644,736,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3359/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=644,928,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3360/500000] + optim/total_grad_norm=2.146 + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=645,120,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3361/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=645,312,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3362/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=645,504,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3363/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=645,696,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3364/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=645,888,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3365/500000] + train/ActionNoiseL2Loss=0.1600 + throughput/total_tokens=646,080,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3366/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=646,272,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3367/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=646,464,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3368/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=646,656,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3369/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=646,848,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3370/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=647,040,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3371/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=647,232,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3372/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=647,424,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3373/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=647,616,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3374/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=647,808,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3375/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=648,000,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3376/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=648,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3377/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=648,384,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3378/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=648,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3379/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=648,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3380/500000] + optim/total_grad_norm=2.661 + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=648,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3381/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=649,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3382/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=649,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3383/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=649,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3384/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=649,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3385/500000] + train/ActionNoiseL2Loss=0.1153 + throughput/total_tokens=649,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3386/500000] + train/ActionNoiseL2Loss=0.1186 + throughput/total_tokens=650,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3387/500000] + train/ActionNoiseL2Loss=0.1348 + throughput/total_tokens=650,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3388/500000] + train/ActionNoiseL2Loss=0.1242 + throughput/total_tokens=650,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3389/500000] + train/ActionNoiseL2Loss=0.1095 + throughput/total_tokens=650,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3390/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=650,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3391/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=651,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3392/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=651,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3393/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=651,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3394/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=651,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3395/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=651,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3396/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=652,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3397/500000] + train/ActionNoiseL2Loss=0.1066 + throughput/total_tokens=652,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3398/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=652,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3399/500000] + train/ActionNoiseL2Loss=0.1152 + throughput/total_tokens=652,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3400/500000] + optim/total_grad_norm=1.670 + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=652,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3401/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=652,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3402/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=653,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3403/500000] + train/ActionNoiseL2Loss=0.1018 + throughput/total_tokens=653,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3404/500000] + train/ActionNoiseL2Loss=0.1072 + throughput/total_tokens=653,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3405/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=653,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3406/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=653,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3407/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=654,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3408/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=654,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3409/500000] + train/ActionNoiseL2Loss=0.1360 + throughput/total_tokens=654,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3410/500000] + train/ActionNoiseL2Loss=0.1246 + throughput/total_tokens=654,720,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3411/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=654,912,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3412/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=655,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3413/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=655,296,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3414/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=655,488,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3415/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=655,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3416/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=655,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3417/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=656,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3418/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=656,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3419/500000] + train/ActionNoiseL2Loss=0.1513 + throughput/total_tokens=656,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3420/500000] + optim/total_grad_norm=1.695 + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=656,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3421/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=656,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3422/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=657,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3423/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=657,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3424/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=657,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3425/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=657,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3426/500000] + train/ActionNoiseL2Loss=0.1519 + throughput/total_tokens=657,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3427/500000] + train/ActionNoiseL2Loss=0.1201 + throughput/total_tokens=657,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3428/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=658,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3429/500000] + train/ActionNoiseL2Loss=0.1222 + throughput/total_tokens=658,368,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3430/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=658,560,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3431/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=658,752,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3432/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=658,944,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3433/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=659,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3434/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=659,328,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3435/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=659,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3436/500000] + train/ActionNoiseL2Loss=0.1258 + throughput/total_tokens=659,712,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3437/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=659,904,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3438/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=660,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3439/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=660,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3440/500000] + optim/total_grad_norm=1.821 + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=660,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3441/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=660,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3442/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=660,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3443/500000] + train/ActionNoiseL2Loss=0.1210 + throughput/total_tokens=661,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3444/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=661,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3445/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=661,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3446/500000] + train/ActionNoiseL2Loss=0.1100 + throughput/total_tokens=661,632,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3447/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=661,824,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3448/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=662,016,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3449/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=662,208,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3450/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=662,400,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3451/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=662,592,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=3452/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=662,784,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=3453/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=662,976,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=3454/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=663,168,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=3455/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=663,360,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=3456/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=663,552,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=3457/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=663,744,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=3458/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=663,936,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=3459/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=664,128,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=3460/500000] + optim/total_grad_norm=2.337 + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=664,320,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,467 +[step=3461/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=664,512,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3462/500000] + train/ActionNoiseL2Loss=0.1070 + throughput/total_tokens=664,704,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3463/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=664,896,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3464/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=665,088,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3465/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=665,280,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3466/500000] + train/ActionNoiseL2Loss=0.1393 + throughput/total_tokens=665,472,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3467/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=665,664,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3468/500000] + train/ActionNoiseL2Loss=0.1102 + throughput/total_tokens=665,856,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3469/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=666,048,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3470/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=666,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3471/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=666,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3472/500000] + train/ActionNoiseL2Loss=0.1536 + throughput/total_tokens=666,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3473/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=666,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3474/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=667,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3475/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=667,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3476/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=667,392,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3477/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=667,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3478/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=667,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3479/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=667,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3480/500000] + optim/total_grad_norm=1.732 + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=668,160,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3481/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=668,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3482/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=668,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3483/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=668,736,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3484/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=668,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3485/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=669,120,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3486/500000] + train/ActionNoiseL2Loss=0.1049 + throughput/total_tokens=669,312,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3487/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=669,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3488/500000] + train/ActionNoiseL2Loss=0.1340 + throughput/total_tokens=669,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3489/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=669,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3490/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=670,080,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3491/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=670,272,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3492/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=670,464,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3493/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=670,656,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3494/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=670,848,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3495/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=671,040,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3496/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=671,232,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3497/500000] + train/ActionNoiseL2Loss=0.1573 + throughput/total_tokens=671,424,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3498/500000] + train/ActionNoiseL2Loss=0.1552 + throughput/total_tokens=671,616,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3499/500000] + train/ActionNoiseL2Loss=0.0968 + throughput/total_tokens=671,808,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3500/500000] + optim/total_grad_norm=1.590 + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=672,000,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +10/06 [13:25:54] INFO | >> Saving config... checkpoint.py:608 +10/06 [13:26:28] INFO | >> Saving model state... checkpoint.py:796 +10/06 [13:27:41] INFO | >> Saving optim state... checkpoint.py:811 +10/06 [13:29:15] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=3501/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=672,192,000 + throughput/device/tokens_per_second=1,187 + throughput/device/batches_per_second=0.0495 +[step=3502/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=672,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3503/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=672,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3504/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=672,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3505/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=672,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3506/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=673,152,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3507/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=673,344,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3508/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=673,536,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3509/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=673,728,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3510/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=673,920,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3511/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=674,112,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3512/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=674,304,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3513/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=674,496,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3514/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=674,688,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3515/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=674,880,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3516/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=675,072,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3517/500000] + train/ActionNoiseL2Loss=0.1259 + throughput/total_tokens=675,264,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3518/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=675,456,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3519/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=675,648,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3520/500000] + optim/total_grad_norm=1.669 + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=675,840,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3521/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=676,032,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3522/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=676,224,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3523/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=676,416,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3524/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=676,608,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3525/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=676,800,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3526/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=676,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3527/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=677,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3528/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=677,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3529/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=677,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3530/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=677,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3531/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=677,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3532/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=678,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3533/500000] + train/ActionNoiseL2Loss=0.1654 + throughput/total_tokens=678,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3534/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=678,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3535/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=678,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3536/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=678,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3537/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=679,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3538/500000] + train/ActionNoiseL2Loss=0.1603 + throughput/total_tokens=679,296,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3539/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=679,488,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3540/500000] + optim/total_grad_norm=1.360 + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=679,680,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3541/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=679,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3542/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=680,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3543/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=680,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3544/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=680,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3545/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=680,640,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3546/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=680,832,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3547/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=681,024,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3548/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=681,216,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3549/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=681,408,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3550/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=681,600,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3551/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=681,792,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3552/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=681,984,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3553/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=682,176,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3554/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=682,368,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3555/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=682,560,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3556/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=682,752,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3557/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=682,944,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3558/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=683,136,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3559/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=683,328,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3560/500000] + optim/total_grad_norm=1.729 + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=683,520,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3561/500000] + train/ActionNoiseL2Loss=0.1013 + throughput/total_tokens=683,712,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3562/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=683,904,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3563/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=684,096,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3564/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=684,288,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3565/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=684,480,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3566/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=684,672,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3567/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=684,864,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3568/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=685,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3569/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=685,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3570/500000] + train/ActionNoiseL2Loss=0.1167 + throughput/total_tokens=685,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3571/500000] + train/ActionNoiseL2Loss=0.1288 + throughput/total_tokens=685,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3572/500000] + train/ActionNoiseL2Loss=0.1202 + throughput/total_tokens=685,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3573/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=686,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3574/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=686,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3575/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=686,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3576/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=686,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3577/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=686,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3578/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=686,976,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3579/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=687,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3580/500000] + optim/total_grad_norm=1.526 + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=687,360,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3581/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=687,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3582/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=687,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3583/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=687,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3584/500000] + train/ActionNoiseL2Loss=0.1367 + throughput/total_tokens=688,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3585/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=688,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3586/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=688,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3587/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=688,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3588/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=688,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3589/500000] + train/ActionNoiseL2Loss=0.1658 + throughput/total_tokens=689,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3590/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=689,280,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3591/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=689,472,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3592/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=689,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3593/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=689,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3594/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=690,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3595/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=690,240,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3596/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=690,432,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3597/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=690,624,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3598/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=690,816,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3599/500000] + train/ActionNoiseL2Loss=0.1393 + throughput/total_tokens=691,008,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3600/500000] + optim/total_grad_norm=2.061 + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=691,200,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3601/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=691,392,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3602/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=691,584,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3603/500000] + train/ActionNoiseL2Loss=0.1427 + throughput/total_tokens=691,776,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3604/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=691,968,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3605/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=692,160,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3606/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=692,352,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3607/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=692,544,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3608/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=692,736,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3609/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=692,928,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3610/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=693,120,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3611/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=693,312,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3612/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=693,504,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3613/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=693,696,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3614/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=693,888,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3615/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=694,080,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3616/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=694,272,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3617/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=694,464,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3618/500000] + train/ActionNoiseL2Loss=0.1582 + throughput/total_tokens=694,656,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3619/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=694,848,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3620/500000] + optim/total_grad_norm=1.883 + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=695,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3621/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=695,232,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3622/500000] + train/ActionNoiseL2Loss=0.0258 + throughput/total_tokens=695,424,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3623/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=695,616,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3624/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=695,808,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3625/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=696,000,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3626/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=696,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3627/500000] + train/ActionNoiseL2Loss=0.1248 + throughput/total_tokens=696,384,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3628/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=696,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3629/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=696,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3630/500000] + train/ActionNoiseL2Loss=0.2074 + throughput/total_tokens=696,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3631/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=697,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3632/500000] + train/ActionNoiseL2Loss=0.1185 + throughput/total_tokens=697,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3633/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=697,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3634/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=697,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3635/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=697,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3636/500000] + train/ActionNoiseL2Loss=0.1545 + throughput/total_tokens=698,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3637/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=698,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3638/500000] + train/ActionNoiseL2Loss=0.1299 + throughput/total_tokens=698,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3639/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=698,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3640/500000] + optim/total_grad_norm=1.384 + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=698,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3641/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=699,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3642/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=699,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3643/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=699,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3644/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=699,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3645/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=699,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3646/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=700,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3647/500000] + train/ActionNoiseL2Loss=0.1959 + throughput/total_tokens=700,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3648/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=700,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3649/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=700,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3650/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=700,800,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3651/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=700,992,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3652/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=701,184,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3653/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=701,376,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3654/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=701,568,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3655/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=701,760,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3656/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=701,952,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3657/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=702,144,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3658/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=702,336,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3659/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=702,528,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3660/500000] + optim/total_grad_norm=2.269 + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=702,720,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3661/500000] + train/ActionNoiseL2Loss=0.1106 + throughput/total_tokens=702,912,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3662/500000] + train/ActionNoiseL2Loss=0.1357 + throughput/total_tokens=703,104,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3663/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=703,296,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3664/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=703,488,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3665/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=703,680,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3666/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=703,872,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3667/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=704,064,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3668/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=704,256,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3669/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=704,448,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3670/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=704,640,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3671/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=704,832,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3672/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=705,024,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3673/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=705,216,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3674/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=705,408,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3675/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=705,600,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3676/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=705,792,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3677/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=705,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3678/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=706,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3679/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=706,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3680/500000] + optim/total_grad_norm=2.416 + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=706,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3681/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=706,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3682/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=706,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3683/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=707,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3684/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=707,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3685/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=707,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3686/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=707,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3687/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=707,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3688/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=708,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3689/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=708,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3690/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=708,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3691/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=708,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3692/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=708,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3693/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=709,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3694/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=709,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3695/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=709,440,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3696/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=709,632,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3697/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=709,824,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3698/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=710,016,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3699/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=710,208,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3700/500000] + optim/total_grad_norm=1.497 + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=710,400,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3701/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=710,592,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3702/500000] + train/ActionNoiseL2Loss=0.1121 + throughput/total_tokens=710,784,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3703/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=710,976,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3704/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=711,168,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3705/500000] + train/ActionNoiseL2Loss=0.1152 + throughput/total_tokens=711,360,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3706/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=711,552,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3707/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=711,744,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3708/500000] + train/ActionNoiseL2Loss=0.1107 + throughput/total_tokens=711,936,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3709/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=712,128,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3710/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=712,320,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3711/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=712,512,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3712/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=712,704,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3713/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=712,896,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3714/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=713,088,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3715/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=713,280,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3716/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=713,472,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3717/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=713,664,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3718/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=713,856,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3719/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=714,048,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=3720/500000] + optim/total_grad_norm=1.798 + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=714,240,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3721/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=714,432,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3722/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=714,624,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3723/500000] + train/ActionNoiseL2Loss=0.1307 + throughput/total_tokens=714,816,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3724/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=715,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3725/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=715,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3726/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=715,392,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3727/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=715,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3728/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=715,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3729/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=715,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3730/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=716,160,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3731/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=716,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3732/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=716,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3733/500000] + train/ActionNoiseL2Loss=0.1346 + throughput/total_tokens=716,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3734/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=716,928,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3735/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=717,120,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3736/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=717,312,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3737/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=717,504,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3738/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=717,696,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3739/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=717,888,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3740/500000] + optim/total_grad_norm=1.670 + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=718,080,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3741/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=718,272,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3742/500000] + train/ActionNoiseL2Loss=0.1366 + throughput/total_tokens=718,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3743/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=718,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3744/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=718,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3745/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=719,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3746/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=719,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3747/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=719,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3748/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=719,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3749/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=719,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3750/500000] + train/ActionNoiseL2Loss=0.1195 + throughput/total_tokens=720,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3751/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=720,192,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3752/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=720,384,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3753/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=720,576,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3754/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=720,768,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3755/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=720,960,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3756/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=721,152,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3757/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=721,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3758/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=721,536,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3759/500000] + train/ActionNoiseL2Loss=0.1293 + throughput/total_tokens=721,728,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3760/500000] + optim/total_grad_norm=1.685 + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=721,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3761/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=722,112,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3762/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=722,304,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3763/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=722,496,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3764/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=722,688,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3765/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=722,880,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3766/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=723,072,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3767/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=723,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3768/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=723,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3769/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=723,648,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3770/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=723,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3771/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=724,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3772/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=724,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3773/500000] + train/ActionNoiseL2Loss=0.1325 + throughput/total_tokens=724,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3774/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=724,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3775/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=724,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3776/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=724,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3777/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=725,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3778/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=725,376,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3779/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=725,568,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3780/500000] + optim/total_grad_norm=1.870 + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=725,760,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3781/500000] + train/ActionNoiseL2Loss=0.1325 + throughput/total_tokens=725,952,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3782/500000] + train/ActionNoiseL2Loss=0.1197 + throughput/total_tokens=726,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3783/500000] + train/ActionNoiseL2Loss=0.1296 + throughput/total_tokens=726,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3784/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=726,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3785/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=726,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3786/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=726,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3787/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=727,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3788/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=727,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3789/500000] + train/ActionNoiseL2Loss=0.1634 + throughput/total_tokens=727,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3790/500000] + train/ActionNoiseL2Loss=0.1205 + throughput/total_tokens=727,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3791/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=727,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3792/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=728,064,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3793/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=728,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3794/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=728,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3795/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=728,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3796/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=728,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3797/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=729,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3798/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=729,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3799/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=729,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3800/500000] + optim/total_grad_norm=1.516 + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=729,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3801/500000] + train/ActionNoiseL2Loss=0.1170 + throughput/total_tokens=729,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3802/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=729,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3803/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=730,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3804/500000] + train/ActionNoiseL2Loss=0.1264 + throughput/total_tokens=730,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3805/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=730,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3806/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=730,752,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3807/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=730,944,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3808/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=731,136,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3809/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=731,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3810/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=731,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3811/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=731,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3812/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=731,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3813/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=732,096,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3814/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=732,288,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3815/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=732,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3816/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=732,672,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3817/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=732,864,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3818/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=733,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3819/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=733,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3820/500000] + optim/total_grad_norm=2.023 + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=733,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3821/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=733,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3822/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=733,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3823/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=734,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3824/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=734,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3825/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=734,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3826/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=734,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3827/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=734,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3828/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=734,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3829/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=735,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3830/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=735,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3831/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=735,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3832/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=735,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3833/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=735,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3834/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=736,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3835/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=736,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3836/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=736,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3837/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=736,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3838/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=736,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3839/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=737,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3840/500000] + optim/total_grad_norm=1.524 + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=737,280,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3841/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=737,472,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3842/500000] + train/ActionNoiseL2Loss=0.1138 + throughput/total_tokens=737,664,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3843/500000] + train/ActionNoiseL2Loss=0.1071 + throughput/total_tokens=737,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3844/500000] + train/ActionNoiseL2Loss=0.1144 + throughput/total_tokens=738,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3845/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=738,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3846/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=738,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3847/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=738,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3848/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=738,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3849/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=739,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3850/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=739,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3851/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=739,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3852/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=739,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3853/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=739,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3854/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=739,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3855/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=740,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3856/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=740,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3857/500000] + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=740,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3858/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=740,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3859/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=740,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3860/500000] + optim/total_grad_norm=1.757 + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=741,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3861/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=741,312,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3862/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=741,504,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3863/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=741,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3864/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=741,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3865/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=742,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3866/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=742,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3867/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=742,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3868/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=742,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3869/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=742,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3870/500000] + train/ActionNoiseL2Loss=0.1366 + throughput/total_tokens=743,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3871/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=743,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3872/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=743,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3873/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=743,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3874/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=743,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3875/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=744,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3876/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=744,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3877/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=744,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3878/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=744,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3879/500000] + train/ActionNoiseL2Loss=0.1084 + throughput/total_tokens=744,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3880/500000] + optim/total_grad_norm=3.076 + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=744,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3881/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=745,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3882/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=745,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3883/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=745,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3884/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=745,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3885/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=745,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3886/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=746,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3887/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=746,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3888/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=746,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3889/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=746,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3890/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=746,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3891/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=747,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3892/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=747,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3893/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=747,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3894/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=747,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3895/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=747,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3896/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=748,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3897/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=748,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3898/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=748,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3899/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=748,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3900/500000] + optim/total_grad_norm=1.357 + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=748,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3901/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=748,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3902/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=749,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3903/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=749,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3904/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=749,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3905/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=749,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3906/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=749,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3907/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=750,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3908/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=750,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3909/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=750,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3910/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=750,720,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3911/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=750,912,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3912/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=751,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3913/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=751,296,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3914/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=751,488,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3915/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=751,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3916/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=751,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3917/500000] + train/ActionNoiseL2Loss=0.1458 + throughput/total_tokens=752,064,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3918/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=752,256,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3919/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=752,448,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3920/500000] + optim/total_grad_norm=1.236 + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=752,640,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3921/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=752,832,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3922/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=753,024,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3923/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=753,216,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3924/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=753,408,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3925/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=753,600,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3926/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=753,792,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3927/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=753,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3928/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=754,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3929/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=754,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3930/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=754,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3931/500000] + train/ActionNoiseL2Loss=0.1574 + throughput/total_tokens=754,752,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=3932/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=754,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3933/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=755,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3934/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=755,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3935/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=755,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3936/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=755,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3937/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=755,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3938/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=756,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3939/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=756,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3940/500000] + optim/total_grad_norm=2.032 + train/ActionNoiseL2Loss=0.1343 + throughput/total_tokens=756,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=3941/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=756,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3942/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=756,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3943/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=757,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3944/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=757,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3945/500000] + train/ActionNoiseL2Loss=0.1105 + throughput/total_tokens=757,440,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3946/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=757,632,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3947/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=757,824,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3948/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=758,016,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=3949/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=758,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3950/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=758,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3951/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=758,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3952/500000] + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=758,784,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3953/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=758,976,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3954/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=759,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3955/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=759,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3956/500000] + train/ActionNoiseL2Loss=0.1188 + throughput/total_tokens=759,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3957/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=759,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3958/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=759,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3959/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=760,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3960/500000] + optim/total_grad_norm=2.648 + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=760,320,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=3961/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=760,512,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=3962/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=760,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3963/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=760,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3964/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=761,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3965/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=761,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3966/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=761,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3967/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=761,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3968/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=761,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3969/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=762,048,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=3970/500000] + train/ActionNoiseL2Loss=0.1653 + throughput/total_tokens=762,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3971/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=762,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3972/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=762,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3973/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=762,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3974/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=763,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3975/500000] + train/ActionNoiseL2Loss=0.1055 + throughput/total_tokens=763,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3976/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=763,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3977/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=763,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3978/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=763,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3979/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=763,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3980/500000] + optim/total_grad_norm=1.623 + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=764,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3981/500000] + train/ActionNoiseL2Loss=0.1170 + throughput/total_tokens=764,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3982/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=764,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3983/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=764,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3984/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=764,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3985/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=765,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=3986/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=765,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3987/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=765,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=3988/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=765,696,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3989/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=765,888,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3990/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=766,080,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=3991/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=766,272,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3992/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=766,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3993/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=766,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3994/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=766,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3995/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=767,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3996/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=767,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3997/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=767,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3998/500000] + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=767,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=3999/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=767,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4000/500000] + optim/total_grad_norm=1.816 + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=768,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/06 [16:24:04] INFO | >> Saving config... checkpoint.py:608 +10/06 [16:24:38] INFO | >> Saving model state... checkpoint.py:796 +10/06 [16:25:52] INFO | >> Saving optim state... checkpoint.py:811 +10/06 [16:27:19] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=4001/500000] + train/ActionNoiseL2Loss=0.1122 + throughput/total_tokens=768,192,000 + throughput/device/tokens_per_second=1,195 + throughput/device/batches_per_second=0.0498 +[step=4002/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=768,384,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=4003/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=768,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4004/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=768,768,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4005/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=768,960,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4006/500000] + train/ActionNoiseL2Loss=0.1299 + throughput/total_tokens=769,152,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4007/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=769,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4008/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=769,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4009/500000] + train/ActionNoiseL2Loss=0.0982 + throughput/total_tokens=769,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4010/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=769,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4011/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=770,112,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4012/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=770,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4013/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=770,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4014/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=770,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4015/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=770,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4016/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=771,072,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4017/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=771,264,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4018/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=771,456,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4019/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=771,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4020/500000] + optim/total_grad_norm=1.620 + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=771,840,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4021/500000] + train/ActionNoiseL2Loss=0.1688 + throughput/total_tokens=772,032,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4022/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=772,224,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4023/500000] + train/ActionNoiseL2Loss=0.1750 + throughput/total_tokens=772,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4024/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=772,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4025/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=772,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4026/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=772,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4027/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=773,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4028/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=773,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4029/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=773,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4030/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=773,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4031/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=773,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4032/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=774,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4033/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=774,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4034/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=774,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4035/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=774,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4036/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=774,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4037/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=775,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4038/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=775,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4039/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=775,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4040/500000] + optim/total_grad_norm=2.239 + train/ActionNoiseL2Loss=0.1424 + throughput/total_tokens=775,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4041/500000] + train/ActionNoiseL2Loss=0.1513 + throughput/total_tokens=775,872,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4042/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=776,064,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4043/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=776,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4044/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=776,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4045/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=776,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4046/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=776,832,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4047/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=777,024,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4048/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=777,216,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4049/500000] + train/ActionNoiseL2Loss=0.1098 + throughput/total_tokens=777,408,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4050/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=777,600,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4051/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=777,792,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4052/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=777,984,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4053/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=778,176,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4054/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=778,368,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4055/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=778,560,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4056/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=778,752,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4057/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=778,944,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4058/500000] + train/ActionNoiseL2Loss=0.1324 + throughput/total_tokens=779,136,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4059/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=779,328,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4060/500000] + optim/total_grad_norm=1.960 + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=779,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=4061/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=779,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4062/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=779,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4063/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=780,096,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4064/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=780,288,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4065/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=780,480,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4066/500000] + train/ActionNoiseL2Loss=0.1129 + throughput/total_tokens=780,672,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4067/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=780,864,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4068/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=781,056,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4069/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=781,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4070/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=781,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4071/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=781,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4072/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=781,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4073/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=782,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4074/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=782,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4075/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=782,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4076/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=782,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4077/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=782,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4078/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=782,976,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4079/500000] + train/ActionNoiseL2Loss=0.1601 + throughput/total_tokens=783,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4080/500000] + optim/total_grad_norm=1.767 + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=783,360,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4081/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=783,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4082/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=783,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4083/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=783,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4084/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=784,128,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4085/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=784,320,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4086/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=784,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4087/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=784,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4088/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=784,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4089/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=785,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4090/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=785,280,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4091/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=785,472,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4092/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=785,664,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4093/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=785,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4094/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=786,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4095/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=786,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4096/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=786,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4097/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=786,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4098/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=786,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4099/500000] + train/ActionNoiseL2Loss=0.1049 + throughput/total_tokens=787,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4100/500000] + optim/total_grad_norm=1.360 + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=787,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4101/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=787,392,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4102/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=787,584,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4103/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=787,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4104/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=787,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4105/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=788,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4106/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=788,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4107/500000] + train/ActionNoiseL2Loss=0.1554 + throughput/total_tokens=788,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4108/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=788,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4109/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=788,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4110/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=789,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=4111/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=789,312,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4112/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=789,504,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4113/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=789,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4114/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=789,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4115/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=790,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4116/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=790,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4117/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=790,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4118/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=790,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4119/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=790,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4120/500000] + optim/total_grad_norm=3.351 + train/ActionNoiseL2Loss=0.1650 + throughput/total_tokens=791,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4121/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=791,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4122/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=791,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4123/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=791,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4124/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=791,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4125/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=792,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4126/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=792,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4127/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=792,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4128/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=792,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4129/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=792,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4130/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=792,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4131/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=793,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4132/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=793,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4133/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=793,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4134/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=793,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4135/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=793,920,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4136/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=794,112,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4137/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=794,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4138/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=794,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4139/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=794,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4140/500000] + optim/total_grad_norm=1.522 + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=794,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4141/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=795,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4142/500000] + train/ActionNoiseL2Loss=0.1055 + throughput/total_tokens=795,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4143/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=795,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4144/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=795,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4145/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=795,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4146/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=796,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4147/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=796,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4148/500000] + train/ActionNoiseL2Loss=0.1371 + throughput/total_tokens=796,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4149/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=796,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4150/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=796,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4151/500000] + train/ActionNoiseL2Loss=0.1084 + throughput/total_tokens=796,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4152/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=797,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4153/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=797,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4154/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=797,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4155/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=797,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4156/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=797,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4157/500000] + train/ActionNoiseL2Loss=0.1323 + throughput/total_tokens=798,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4158/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=798,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4159/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=798,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4160/500000] + optim/total_grad_norm=1.702 + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=798,720,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=4161/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=798,912,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4162/500000] + train/ActionNoiseL2Loss=0.1319 + throughput/total_tokens=799,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4163/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=799,296,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4164/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=799,488,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4165/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=799,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4166/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=799,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4167/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=800,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4168/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=800,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4169/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=800,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4170/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=800,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4171/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=800,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4172/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=801,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4173/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=801,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4174/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=801,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4175/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=801,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4176/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=801,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4177/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=801,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4178/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=802,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4179/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=802,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4180/500000] + optim/total_grad_norm=1.301 + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=802,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4181/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=802,752,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4182/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=802,944,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4183/500000] + train/ActionNoiseL2Loss=0.1130 + throughput/total_tokens=803,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4184/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=803,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4185/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=803,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4186/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=803,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4187/500000] + train/ActionNoiseL2Loss=0.1146 + throughput/total_tokens=803,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4188/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=804,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4189/500000] + train/ActionNoiseL2Loss=0.1202 + throughput/total_tokens=804,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4190/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=804,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4191/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=804,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4192/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=804,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4193/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=805,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4194/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=805,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4195/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=805,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4196/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=805,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4197/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=805,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4198/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=806,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4199/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=806,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4200/500000] + optim/total_grad_norm=1.685 + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=806,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4201/500000] + train/ActionNoiseL2Loss=0.1251 + throughput/total_tokens=806,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4202/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=806,784,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4203/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=806,976,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4204/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=807,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4205/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=807,360,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4206/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=807,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4207/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=807,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4208/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=807,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4209/500000] + train/ActionNoiseL2Loss=0.1345 + throughput/total_tokens=808,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4210/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=808,320,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=4211/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=808,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4212/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=808,704,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4213/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=808,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4214/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=809,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4215/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=809,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4216/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=809,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4217/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=809,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4218/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=809,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4219/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=810,048,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4220/500000] + optim/total_grad_norm=1.175 + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=810,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4221/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=810,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4222/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=810,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4223/500000] + train/ActionNoiseL2Loss=0.0971 + throughput/total_tokens=810,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4224/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=811,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4225/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=811,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4226/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=811,392,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4227/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=811,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4228/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=811,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4229/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=811,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4230/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=812,160,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4231/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=812,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4232/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=812,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4233/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=812,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4234/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=812,928,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4235/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=813,120,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4236/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=813,312,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4237/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=813,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4238/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=813,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4239/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=813,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4240/500000] + optim/total_grad_norm=1.582 + train/ActionNoiseL2Loss=0.1124 + throughput/total_tokens=814,080,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4241/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=814,272,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4242/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=814,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4243/500000] + train/ActionNoiseL2Loss=0.1647 + throughput/total_tokens=814,656,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4244/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=814,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4245/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=815,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4246/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=815,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4247/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=815,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4248/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=815,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4249/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=815,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4250/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=816,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4251/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=816,192,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4252/500000] + train/ActionNoiseL2Loss=0.1325 + throughput/total_tokens=816,384,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4253/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=816,576,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4254/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=816,768,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4255/500000] + train/ActionNoiseL2Loss=0.1199 + throughput/total_tokens=816,960,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4256/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=817,152,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4257/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=817,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4258/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=817,536,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4259/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=817,728,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4260/500000] + optim/total_grad_norm=1.327 + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=817,920,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=4261/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=818,112,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4262/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=818,304,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4263/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=818,496,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4264/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=818,688,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4265/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=818,880,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4266/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=819,072,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4267/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=819,264,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4268/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=819,456,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4269/500000] + train/ActionNoiseL2Loss=0.0996 + throughput/total_tokens=819,648,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4270/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=819,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4271/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=820,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4272/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=820,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4273/500000] + train/ActionNoiseL2Loss=0.1095 + throughput/total_tokens=820,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4274/500000] + train/ActionNoiseL2Loss=0.1500 + throughput/total_tokens=820,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4275/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=820,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4276/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=820,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4277/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=821,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4278/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=821,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4279/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=821,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4280/500000] + optim/total_grad_norm=1.971 + train/ActionNoiseL2Loss=0.1310 + throughput/total_tokens=821,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4281/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=821,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4282/500000] + train/ActionNoiseL2Loss=0.1137 + throughput/total_tokens=822,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4283/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=822,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4284/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=822,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4285/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=822,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4286/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=822,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4287/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=823,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4288/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=823,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4289/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=823,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4290/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=823,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4291/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=823,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4292/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=824,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4293/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=824,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4294/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=824,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4295/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=824,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4296/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=824,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4297/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=825,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4298/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=825,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4299/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=825,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4300/500000] + optim/total_grad_norm=1.613 + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=825,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4301/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=825,792,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4302/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=825,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4303/500000] + train/ActionNoiseL2Loss=0.1150 + throughput/total_tokens=826,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4304/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=826,368,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4305/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=826,560,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4306/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=826,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4307/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=826,944,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4308/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=827,136,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4309/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=827,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4310/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=827,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=46,467 +[step=4311/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=827,712,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4312/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=827,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4313/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=828,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4314/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=828,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4315/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=828,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4316/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=828,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4317/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=828,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4318/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=829,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4319/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=829,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4320/500000] + optim/total_grad_norm=1.511 + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=829,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4321/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=829,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4322/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=829,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4323/500000] + train/ActionNoiseL2Loss=0.1368 + throughput/total_tokens=830,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4324/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=830,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4325/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=830,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4326/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=830,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4327/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=830,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4328/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=830,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4329/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=831,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4330/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=831,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4331/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=831,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4332/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=831,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4333/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=831,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4334/500000] + train/ActionNoiseL2Loss=0.1090 + throughput/total_tokens=832,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4335/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=832,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4336/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=832,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4337/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=832,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4338/500000] + train/ActionNoiseL2Loss=0.1498 + throughput/total_tokens=832,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4339/500000] + train/ActionNoiseL2Loss=0.1184 + throughput/total_tokens=833,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4340/500000] + optim/total_grad_norm=2.013 + train/ActionNoiseL2Loss=0.1144 + throughput/total_tokens=833,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4341/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=833,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4342/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=833,664,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4343/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=833,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4344/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=834,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4345/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=834,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4346/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=834,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4347/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=834,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4348/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=834,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4349/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=835,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4350/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=835,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4351/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=835,392,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4352/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=835,584,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4353/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=835,776,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4354/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=835,968,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4355/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=836,160,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4356/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=836,352,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4357/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=836,544,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4358/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=836,736,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4359/500000] + train/ActionNoiseL2Loss=0.1367 + throughput/total_tokens=836,928,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4360/500000] + optim/total_grad_norm=1.397 + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=837,120,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=4361/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=837,312,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4362/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=837,504,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4363/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=837,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4364/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=837,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4365/500000] + train/ActionNoiseL2Loss=0.1924 + throughput/total_tokens=838,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4366/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=838,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4367/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=838,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4368/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=838,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4369/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=838,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4370/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=839,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4371/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=839,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4372/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=839,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4373/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=839,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4374/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=839,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4375/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=840,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4376/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=840,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4377/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=840,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4378/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=840,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4379/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=840,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4380/500000] + optim/total_grad_norm=1.265 + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=840,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4381/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=841,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4382/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=841,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4383/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=841,536,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4384/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=841,728,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4385/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=841,920,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4386/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=842,112,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4387/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=842,304,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4388/500000] + train/ActionNoiseL2Loss=0.1096 + throughput/total_tokens=842,496,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4389/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=842,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4390/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=842,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4391/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=843,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4392/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=843,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4393/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=843,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4394/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=843,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4395/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=843,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4396/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=844,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4397/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=844,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4398/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=844,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4399/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=844,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4400/500000] + optim/total_grad_norm=2.150 + train/ActionNoiseL2Loss=0.1112 + throughput/total_tokens=844,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4401/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=844,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4402/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=845,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4403/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=845,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4404/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=845,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4405/500000] + train/ActionNoiseL2Loss=0.1128 + throughput/total_tokens=845,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4406/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=845,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4407/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=846,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4408/500000] + train/ActionNoiseL2Loss=0.1380 + throughput/total_tokens=846,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4409/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=846,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4410/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=846,720,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4411/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=846,912,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4412/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=847,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4413/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=847,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4414/500000] + train/ActionNoiseL2Loss=0.1170 + throughput/total_tokens=847,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4415/500000] + train/ActionNoiseL2Loss=0.1807 + throughput/total_tokens=847,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4416/500000] + train/ActionNoiseL2Loss=0.1024 + throughput/total_tokens=847,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4417/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=848,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4418/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=848,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4419/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=848,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4420/500000] + optim/total_grad_norm=2.807 + train/ActionNoiseL2Loss=0.1167 + throughput/total_tokens=848,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4421/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=848,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4422/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=849,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4423/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=849,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4424/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=849,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4425/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=849,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4426/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=849,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4427/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=849,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4428/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=850,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4429/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=850,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4430/500000] + train/ActionNoiseL2Loss=0.1413 + throughput/total_tokens=850,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4431/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=850,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4432/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=850,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4433/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=851,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4434/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=851,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4435/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=851,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4436/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=851,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4437/500000] + train/ActionNoiseL2Loss=0.1199 + throughput/total_tokens=851,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4438/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=852,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4439/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=852,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4440/500000] + optim/total_grad_norm=1.764 + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=852,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4441/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=852,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4442/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=852,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4443/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=853,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4444/500000] + train/ActionNoiseL2Loss=0.1582 + throughput/total_tokens=853,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4445/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=853,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4446/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=853,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4447/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=853,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4448/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=854,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4449/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=854,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4450/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=854,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4451/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=854,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4452/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=854,784,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4453/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=854,976,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4454/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=855,168,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4455/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=855,360,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4456/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=855,552,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4457/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=855,744,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4458/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=855,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4459/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=856,128,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4460/500000] + optim/total_grad_norm=1.393 + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=856,320,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4461/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=856,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4462/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=856,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4463/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=856,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4464/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=857,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4465/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=857,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4466/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=857,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4467/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=857,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4468/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=857,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4469/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=858,048,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4470/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=858,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4471/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=858,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4472/500000] + train/ActionNoiseL2Loss=0.1230 + throughput/total_tokens=858,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4473/500000] + train/ActionNoiseL2Loss=0.1098 + throughput/total_tokens=858,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4474/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=859,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4475/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=859,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4476/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=859,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4477/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=859,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4478/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=859,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4479/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=859,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4480/500000] + optim/total_grad_norm=1.005 + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=860,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4481/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=860,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4482/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=860,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4483/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=860,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4484/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=860,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4485/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=861,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4486/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=861,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4487/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=861,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4488/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=861,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4489/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=861,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4490/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=862,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4491/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=862,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4492/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=862,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4493/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=862,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4494/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=862,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4495/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=863,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4496/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=863,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4497/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=863,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4498/500000] + train/ActionNoiseL2Loss=0.1700 + throughput/total_tokens=863,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4499/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=863,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4500/500000] + optim/total_grad_norm=0.9920 + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=864,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/06 [19:22:03] INFO | >> Saving config... checkpoint.py:608 +10/06 [19:22:37] INFO | >> Saving model state... checkpoint.py:796 +10/06 [19:23:51] INFO | >> Saving optim state... checkpoint.py:811 +10/06 [19:25:19] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=4501/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=864,192,000 + throughput/device/tokens_per_second=1,189 + throughput/device/batches_per_second=0.0496 +[step=4502/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=864,384,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=4503/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=864,576,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=4504/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=864,768,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=4505/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=864,960,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4506/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=865,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4507/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=865,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4508/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=865,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4509/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=865,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4510/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=865,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4511/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=866,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4512/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=866,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4513/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=866,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4514/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=866,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4515/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=866,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4516/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=867,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4517/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=867,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4518/500000] + train/ActionNoiseL2Loss=0.1152 + throughput/total_tokens=867,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4519/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=867,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4520/500000] + optim/total_grad_norm=0.9414 + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=867,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4521/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=868,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4522/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=868,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4523/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=868,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4524/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=868,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4525/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=868,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4526/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=868,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4527/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=869,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4528/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=869,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4529/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=869,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4530/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=869,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4531/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=869,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4532/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=870,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4533/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=870,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4534/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=870,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4535/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=870,720,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4536/500000] + train/ActionNoiseL2Loss=0.1007 + throughput/total_tokens=870,912,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4537/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=871,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4538/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=871,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4539/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=871,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4540/500000] + optim/total_grad_norm=1.194 + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=871,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=4541/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=871,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4542/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=872,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4543/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=872,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4544/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=872,448,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4545/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=872,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4546/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=872,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4547/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=873,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4548/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=873,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4549/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=873,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4550/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=873,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=4551/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=873,792,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4552/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=873,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4553/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=874,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4554/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=874,368,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4555/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=874,560,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4556/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=874,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4557/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=874,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4558/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=875,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4559/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=875,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4560/500000] + optim/total_grad_norm=1.272 + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=875,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4561/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=875,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4562/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=875,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4563/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=876,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4564/500000] + train/ActionNoiseL2Loss=0.1423 + throughput/total_tokens=876,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4565/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=876,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4566/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=876,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4567/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=876,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4568/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=877,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4569/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=877,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4570/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=877,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4571/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=877,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4572/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=877,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4573/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=878,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4574/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=878,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4575/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=878,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4576/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=878,592,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4577/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=878,784,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4578/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=878,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4579/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=879,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4580/500000] + optim/total_grad_norm=1.092 + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=879,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4581/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=879,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4582/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=879,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4583/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=879,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4584/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=880,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4585/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=880,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4586/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=880,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4587/500000] + train/ActionNoiseL2Loss=0.1049 + throughput/total_tokens=880,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4588/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=880,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4589/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=881,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4590/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=881,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4591/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=881,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4592/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=881,664,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4593/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=881,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4594/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=882,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4595/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=882,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4596/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=882,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4597/500000] + train/ActionNoiseL2Loss=0.0312 + throughput/total_tokens=882,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4598/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=882,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4599/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=883,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4600/500000] + optim/total_grad_norm=1.152 + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=883,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4601/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=883,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4602/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=883,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4603/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=883,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4604/500000] + train/ActionNoiseL2Loss=0.1141 + throughput/total_tokens=883,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4605/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=884,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4606/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=884,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4607/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=884,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4608/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=884,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4609/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=884,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4610/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=885,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4611/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=885,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4612/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=885,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4613/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=885,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4614/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=885,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4615/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=886,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4616/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=886,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4617/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=886,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4618/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=886,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4619/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=886,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4620/500000] + optim/total_grad_norm=1.338 + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=887,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4621/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=887,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4622/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=887,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4623/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=887,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4624/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=887,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4625/500000] + train/ActionNoiseL2Loss=0.1059 + throughput/total_tokens=888,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4626/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=888,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4627/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=888,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4628/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=888,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4629/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=888,768,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4630/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=888,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4631/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=889,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4632/500000] + train/ActionNoiseL2Loss=0.1760 + throughput/total_tokens=889,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4633/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=889,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4634/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=889,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4635/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=889,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4636/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=890,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4637/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=890,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4638/500000] + train/ActionNoiseL2Loss=0.1068 + throughput/total_tokens=890,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4639/500000] + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=890,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4640/500000] + optim/total_grad_norm=1.534 + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=890,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=4641/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=891,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4642/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=891,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4643/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=891,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4644/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=891,648,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4645/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=891,840,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4646/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=892,032,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4647/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=892,224,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4648/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=892,416,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4649/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=892,608,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4650/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=892,800,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=4651/500000] + train/ActionNoiseL2Loss=0.1247 + throughput/total_tokens=892,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4652/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=893,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4653/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=893,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4654/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=893,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4655/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=893,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4656/500000] + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=893,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4657/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=894,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4658/500000] + train/ActionNoiseL2Loss=0.1372 + throughput/total_tokens=894,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4659/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=894,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4660/500000] + optim/total_grad_norm=1.739 + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=894,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4661/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=894,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4662/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=895,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4663/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=895,296,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4664/500000] + train/ActionNoiseL2Loss=0.1870 + throughput/total_tokens=895,488,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4665/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=895,680,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4666/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=895,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4667/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=896,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4668/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=896,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4669/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=896,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4670/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=896,640,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=4671/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=896,832,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4672/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=897,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4673/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=897,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4674/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=897,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4675/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=897,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4676/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=897,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4677/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=897,984,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4678/500000] + train/ActionNoiseL2Loss=0.1398 + throughput/total_tokens=898,176,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4679/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=898,368,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4680/500000] + optim/total_grad_norm=1.390 + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=898,560,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4681/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=898,752,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4682/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=898,944,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4683/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=899,136,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4684/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=899,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4685/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=899,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4686/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=899,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4687/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=899,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4688/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=900,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4689/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=900,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4690/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=900,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4691/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=900,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4692/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=900,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4693/500000] + train/ActionNoiseL2Loss=0.1128 + throughput/total_tokens=901,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4694/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=901,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4695/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=901,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4696/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=901,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4697/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=901,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4698/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=902,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4699/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=902,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4700/500000] + optim/total_grad_norm=1.078 + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=902,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4701/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=902,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4702/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=902,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4703/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=902,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4704/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=903,168,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4705/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=903,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4706/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=903,552,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4707/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=903,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4708/500000] + train/ActionNoiseL2Loss=0.1070 + throughput/total_tokens=903,936,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4709/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=904,128,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4710/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=904,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4711/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=904,512,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4712/500000] + train/ActionNoiseL2Loss=0.1236 + throughput/total_tokens=904,704,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4713/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=904,896,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4714/500000] + train/ActionNoiseL2Loss=0.0292 + throughput/total_tokens=905,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4715/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=905,280,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4716/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=905,472,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4717/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=905,664,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4718/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=905,856,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4719/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=906,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4720/500000] + optim/total_grad_norm=2.057 + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=906,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4721/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=906,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4722/500000] + train/ActionNoiseL2Loss=0.1518 + throughput/total_tokens=906,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4723/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=906,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4724/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=907,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4725/500000] + train/ActionNoiseL2Loss=0.1256 + throughput/total_tokens=907,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4726/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=907,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4727/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=907,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4728/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=907,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4729/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=907,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4730/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=908,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4731/500000] + train/ActionNoiseL2Loss=0.1239 + throughput/total_tokens=908,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4732/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=908,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4733/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=908,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4734/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=908,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4735/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=909,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4736/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=909,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4737/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=909,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4738/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=909,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4739/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=909,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4740/500000] + optim/total_grad_norm=1.538 + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=910,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=4741/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=910,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4742/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=910,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4743/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=910,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4744/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=910,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4745/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=911,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4746/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=911,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4747/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=911,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4748/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=911,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4749/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=911,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4750/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=912,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4751/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=912,192,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4752/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=912,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4753/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=912,576,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4754/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=912,768,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4755/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=912,960,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4756/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=913,152,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4757/500000] + train/ActionNoiseL2Loss=0.1002 + throughput/total_tokens=913,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4758/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=913,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4759/500000] + train/ActionNoiseL2Loss=0.1137 + throughput/total_tokens=913,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4760/500000] + optim/total_grad_norm=2.338 + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=913,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4761/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=914,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4762/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=914,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4763/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=914,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4764/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=914,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4765/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=914,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4766/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=915,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4767/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=915,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4768/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=915,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4769/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=915,648,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4770/500000] + train/ActionNoiseL2Loss=0.1435 + throughput/total_tokens=915,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4771/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=916,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4772/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=916,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4773/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=916,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4774/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=916,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4775/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=916,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4776/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=916,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4777/500000] + train/ActionNoiseL2Loss=0.1135 + throughput/total_tokens=917,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4778/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=917,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4779/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=917,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4780/500000] + optim/total_grad_norm=1.812 + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=917,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=4781/500000] + train/ActionNoiseL2Loss=0.1632 + throughput/total_tokens=917,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4782/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=918,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4783/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=918,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4784/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=918,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4785/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=918,720,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4786/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=918,912,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4787/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=919,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=4788/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=919,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4789/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=919,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4790/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=919,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4791/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=919,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4792/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=920,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4793/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=920,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4794/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=920,448,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4795/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=920,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4796/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=920,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4797/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=921,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4798/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=921,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4799/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=921,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4800/500000] + optim/total_grad_norm=1.799 + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=921,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4801/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=921,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4802/500000] + train/ActionNoiseL2Loss=0.1319 + throughput/total_tokens=921,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4803/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=922,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4804/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=922,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4805/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=922,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4806/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=922,752,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4807/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=922,944,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4808/500000] + train/ActionNoiseL2Loss=0.1356 + throughput/total_tokens=923,136,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4809/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=923,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4810/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=923,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4811/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=923,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4812/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=923,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4813/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=924,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4814/500000] + train/ActionNoiseL2Loss=0.1341 + throughput/total_tokens=924,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4815/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=924,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4816/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=924,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4817/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=924,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4818/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=925,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4819/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=925,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4820/500000] + optim/total_grad_norm=1.819 + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=925,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4821/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=925,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4822/500000] + train/ActionNoiseL2Loss=0.1211 + throughput/total_tokens=925,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4823/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=926,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4824/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=926,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4825/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=926,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4826/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=926,592,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4827/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=926,784,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4828/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=926,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4829/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=927,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4830/500000] + train/ActionNoiseL2Loss=0.1368 + throughput/total_tokens=927,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4831/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=927,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4832/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=927,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4833/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=927,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4834/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=928,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4835/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=928,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4836/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=928,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4837/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=928,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4838/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=928,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4839/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=929,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4840/500000] + optim/total_grad_norm=1.348 + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=929,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4841/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=929,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4842/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=929,664,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4843/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=929,856,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4844/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=930,048,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4845/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=930,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4846/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=930,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4847/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=930,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4848/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=930,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4849/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=931,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4850/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=931,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4851/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=931,392,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4852/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=931,584,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4853/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=931,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4854/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=931,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4855/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=932,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4856/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=932,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4857/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=932,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4858/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=932,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4859/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=932,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4860/500000] + optim/total_grad_norm=1.935 + train/ActionNoiseL2Loss=0.1258 + throughput/total_tokens=933,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4861/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=933,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4862/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=933,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4863/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=933,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4864/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=933,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4865/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=934,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4866/500000] + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=934,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4867/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=934,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4868/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=934,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4869/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=934,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4870/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=935,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4871/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=935,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4872/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=935,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4873/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=935,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4874/500000] + train/ActionNoiseL2Loss=0.1151 + throughput/total_tokens=935,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4875/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=936,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4876/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=936,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4877/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=936,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4878/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=936,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4879/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=936,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4880/500000] + optim/total_grad_norm=1.227 + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=936,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4881/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=937,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4882/500000] + train/ActionNoiseL2Loss=0.1344 + throughput/total_tokens=937,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4883/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=937,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4884/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=937,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4885/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=937,920,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4886/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=938,112,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4887/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=938,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4888/500000] + train/ActionNoiseL2Loss=0.1136 + throughput/total_tokens=938,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4889/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=938,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4890/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=938,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4891/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=939,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4892/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=939,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4893/500000] + train/ActionNoiseL2Loss=0.1222 + throughput/total_tokens=939,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4894/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=939,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4895/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=939,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4896/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=940,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4897/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=940,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4898/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=940,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4899/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=940,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4900/500000] + optim/total_grad_norm=2.155 + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=940,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4901/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=940,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4902/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=941,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=4903/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=941,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4904/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=941,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4905/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=941,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4906/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=941,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4907/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=942,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4908/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=942,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4909/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=942,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4910/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=942,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=4911/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=942,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4912/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=943,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4913/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=943,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4914/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=943,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4915/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=943,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4916/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=943,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4917/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=944,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4918/500000] + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=944,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4919/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=944,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=4920/500000] + optim/total_grad_norm=1.806 + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=944,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4921/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=944,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4922/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=945,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4923/500000] + train/ActionNoiseL2Loss=0.1207 + throughput/total_tokens=945,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4924/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=945,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4925/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=945,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4926/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=945,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4927/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=945,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4928/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=946,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4929/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=946,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4930/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=946,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4931/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=946,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4932/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=946,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4933/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=947,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4934/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=947,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4935/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=947,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4936/500000] + train/ActionNoiseL2Loss=0.1153 + throughput/total_tokens=947,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4937/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=947,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4938/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=948,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4939/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=948,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4940/500000] + optim/total_grad_norm=1.304 + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=948,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4941/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=948,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4942/500000] + train/ActionNoiseL2Loss=0.1272 + throughput/total_tokens=948,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4943/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=949,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4944/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=949,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4945/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=949,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4946/500000] + train/ActionNoiseL2Loss=0.1066 + throughput/total_tokens=949,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4947/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=949,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4948/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=950,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4949/500000] + train/ActionNoiseL2Loss=0.1214 + throughput/total_tokens=950,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4950/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=950,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4951/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=950,592,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4952/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=950,784,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4953/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=950,976,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4954/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=951,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4955/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=951,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4956/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=951,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4957/500000] + train/ActionNoiseL2Loss=0.1260 + throughput/total_tokens=951,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4958/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=951,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4959/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=952,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4960/500000] + optim/total_grad_norm=1.824 + train/ActionNoiseL2Loss=0.1404 + throughput/total_tokens=952,320,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=4961/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=952,512,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4962/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=952,704,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4963/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=952,896,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4964/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=953,088,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4965/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=953,280,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4966/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=953,472,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4967/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=953,664,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4968/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=953,856,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=4969/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=954,048,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=4970/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=954,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4971/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=954,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4972/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=954,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4973/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=954,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4974/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=955,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4975/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=955,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4976/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=955,392,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4977/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=955,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4978/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=955,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4979/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=955,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4980/500000] + optim/total_grad_norm=2.299 + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=956,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4981/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=956,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4982/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=956,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4983/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=956,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4984/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=956,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4985/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=957,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4986/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=957,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4987/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=957,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4988/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=957,696,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4989/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=957,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4990/500000] + train/ActionNoiseL2Loss=0.1365 + throughput/total_tokens=958,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=4991/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=958,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4992/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=958,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=4993/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=958,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4994/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=958,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4995/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=959,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4996/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=959,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4997/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=959,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4998/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=959,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=4999/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=959,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5000/500000] + optim/total_grad_norm=2.016 + train/ActionNoiseL2Loss=0.1173 + throughput/total_tokens=960,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/06 [22:19:47] INFO | >> Saving config... checkpoint.py:608 +10/06 [22:20:21] INFO | >> Saving model state... checkpoint.py:796 +10/06 [22:21:35] INFO | >> Saving optim state... checkpoint.py:811 +10/06 [22:23:03] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=5001/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=960,192,000 + throughput/device/tokens_per_second=1,187 + throughput/device/batches_per_second=0.0495 +[step=5002/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=960,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5003/500000] + train/ActionNoiseL2Loss=0.1315 + throughput/total_tokens=960,576,000 + throughput/device/tokens_per_second=1,131 + throughput/device/batches_per_second=0.0472 +[step=5004/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=960,768,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=5005/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=960,960,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0475 +[step=5006/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=961,152,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=5007/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=961,344,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5008/500000] + train/ActionNoiseL2Loss=0.1420 + throughput/total_tokens=961,536,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5009/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=961,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5010/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=961,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=46,467 +[step=5011/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=962,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5012/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=962,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5013/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=962,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5014/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=962,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5015/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=962,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5016/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=963,072,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5017/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=963,264,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5018/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=963,456,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5019/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=963,648,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5020/500000] + optim/total_grad_norm=1.252 + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=963,840,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=5021/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=964,032,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5022/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=964,224,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=5023/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=964,416,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5024/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=964,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5025/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=964,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5026/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=964,992,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5027/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=965,184,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5028/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=965,376,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5029/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=965,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5030/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=965,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5031/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=965,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5032/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=966,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5033/500000] + train/ActionNoiseL2Loss=0.1393 + throughput/total_tokens=966,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5034/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=966,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5035/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=966,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5036/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=966,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5037/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=967,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5038/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=967,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5039/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=967,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5040/500000] + optim/total_grad_norm=1.450 + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=967,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5041/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=967,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5042/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=968,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5043/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=968,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5044/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=968,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5045/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=968,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5046/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=968,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5047/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=969,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5048/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=969,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5049/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=969,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5050/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=969,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5051/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=969,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5052/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=969,984,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5053/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=970,176,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5054/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=970,368,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5055/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=970,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5056/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=970,752,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5057/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=970,944,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5058/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=971,136,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5059/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=971,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5060/500000] + optim/total_grad_norm=2.248 + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=971,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=5061/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=971,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5062/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=971,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5063/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=972,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5064/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=972,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5065/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=972,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5066/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=972,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5067/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=972,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5068/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=973,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5069/500000] + train/ActionNoiseL2Loss=0.1302 + throughput/total_tokens=973,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5070/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=973,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5071/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=973,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5072/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=973,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5073/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=974,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5074/500000] + train/ActionNoiseL2Loss=0.0293 + throughput/total_tokens=974,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5075/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=974,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5076/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=974,592,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5077/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=974,784,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5078/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=974,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5079/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=975,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5080/500000] + optim/total_grad_norm=1.114 + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=975,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5081/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=975,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5082/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=975,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5083/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=975,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5084/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=976,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5085/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=976,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5086/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=976,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5087/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=976,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5088/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=976,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5089/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=977,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5090/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=977,280,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5091/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=977,472,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5092/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=977,664,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5093/500000] + train/ActionNoiseL2Loss=0.1587 + throughput/total_tokens=977,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5094/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=978,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5095/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=978,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5096/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=978,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5097/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=978,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5098/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=978,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5099/500000] + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=979,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5100/500000] + optim/total_grad_norm=1.507 + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=979,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5101/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=979,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5102/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=979,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5103/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=979,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5104/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=979,968,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5105/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=980,160,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5106/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=980,352,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5107/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=980,544,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5108/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=980,736,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5109/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=980,928,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5110/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=981,120,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=5111/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=981,312,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5112/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=981,504,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5113/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=981,696,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5114/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=981,888,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5115/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=982,080,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5116/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=982,272,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5117/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=982,464,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5118/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=982,656,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5119/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=982,848,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5120/500000] + optim/total_grad_norm=1.632 + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=983,040,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5121/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=983,232,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5122/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=983,424,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5123/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=983,616,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5124/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=983,808,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5125/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=984,000,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5126/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=984,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5127/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=984,384,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5128/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=984,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5129/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=984,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5130/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=984,960,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5131/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=985,152,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5132/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=985,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5133/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=985,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5134/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=985,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5135/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=985,920,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5136/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=986,112,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5137/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=986,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5138/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=986,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5139/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=986,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5140/500000] + optim/total_grad_norm=1.585 + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=986,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5141/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=987,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5142/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=987,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5143/500000] + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=987,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5144/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=987,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5145/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=987,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5146/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=988,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5147/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=988,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5148/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=988,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5149/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=988,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5150/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=988,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5151/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=988,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5152/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=989,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5153/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=989,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5154/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=989,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5155/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=989,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5156/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=989,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5157/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=990,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5158/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=990,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5159/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=990,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5160/500000] + optim/total_grad_norm=1.790 + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=990,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5161/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=990,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5162/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=991,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5163/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=991,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5164/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=991,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5165/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=991,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5166/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=991,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5167/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=992,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5168/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=992,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5169/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=992,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5170/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=992,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5171/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=992,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5172/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=993,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5173/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=993,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5174/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=993,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5175/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=993,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5176/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=993,792,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5177/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=993,984,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5178/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=994,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5179/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=994,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5180/500000] + optim/total_grad_norm=1.354 + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=994,560,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5181/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=994,752,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5182/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=994,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5183/500000] + train/ActionNoiseL2Loss=0.0971 + throughput/total_tokens=995,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5184/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=995,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5185/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=995,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5186/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=995,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5187/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=995,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5188/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=996,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5189/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=996,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5190/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=996,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5191/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=996,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5192/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=996,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5193/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=997,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5194/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=997,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5195/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=997,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5196/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=997,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5197/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=997,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5198/500000] + train/ActionNoiseL2Loss=0.1300 + throughput/total_tokens=998,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5199/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=998,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5200/500000] + optim/total_grad_norm=1.582 + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=998,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=5201/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=998,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5202/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=998,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5203/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=998,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5204/500000] + train/ActionNoiseL2Loss=0.1517 + throughput/total_tokens=999,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5205/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=999,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5206/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=999,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5207/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=999,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5208/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=999,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5209/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=1,000,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5210/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,000,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5211/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,000,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5212/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=1,000,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5213/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=1,000,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5214/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,001,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5215/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,001,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5216/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,001,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5217/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,001,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5218/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=1,001,856,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5219/500000] + train/ActionNoiseL2Loss=0.1300 + throughput/total_tokens=1,002,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5220/500000] + optim/total_grad_norm=1.530 + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=1,002,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5221/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,002,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5222/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,002,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5223/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,002,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5224/500000] + train/ActionNoiseL2Loss=0.1193 + throughput/total_tokens=1,003,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5225/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=1,003,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5226/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,003,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5227/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=1,003,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5228/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=1,003,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5229/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,003,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5230/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,004,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5231/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,004,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5232/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,004,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5233/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,004,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5234/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,004,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5235/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=1,005,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5236/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,005,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5237/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,005,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5238/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=1,005,696,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5239/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,005,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5240/500000] + optim/total_grad_norm=1.362 + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,006,080,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5241/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=1,006,272,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5242/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,006,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5243/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,006,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5244/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,006,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5245/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,007,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5246/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,007,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5247/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,007,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5248/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=1,007,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5249/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,007,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5250/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=1,008,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5251/500000] + train/ActionNoiseL2Loss=0.1769 + throughput/total_tokens=1,008,192,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5252/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,008,384,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5253/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,008,576,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5254/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,008,768,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5255/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=1,008,960,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5256/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,009,152,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5257/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,009,344,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5258/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,009,536,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5259/500000] + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=1,009,728,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5260/500000] + optim/total_grad_norm=2.373 + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,009,920,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=5261/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,010,112,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5262/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=1,010,304,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5263/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,010,496,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5264/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,010,688,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5265/500000] + train/ActionNoiseL2Loss=0.1090 + throughput/total_tokens=1,010,880,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5266/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,011,072,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5267/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,011,264,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5268/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=1,011,456,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5269/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,011,648,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5270/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,011,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5271/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,012,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5272/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,012,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5273/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,012,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5274/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,012,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5275/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,012,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5276/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=1,012,992,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5277/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=1,013,184,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5278/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=1,013,376,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5279/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,013,568,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5280/500000] + optim/total_grad_norm=1.359 + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,013,760,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5281/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=1,013,952,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5282/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,014,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5283/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=1,014,336,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5284/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,014,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5285/500000] + train/ActionNoiseL2Loss=0.1269 + throughput/total_tokens=1,014,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5286/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=1,014,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5287/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,015,104,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5288/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,015,296,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5289/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,015,488,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5290/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=1,015,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5291/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=1,015,872,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5292/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=1,016,064,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5293/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,016,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5294/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=1,016,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5295/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=1,016,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5296/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=1,016,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5297/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,017,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5298/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,017,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5299/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,017,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5300/500000] + optim/total_grad_norm=1.304 + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,017,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5301/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,017,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5302/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=1,017,984,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5303/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,018,176,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5304/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=1,018,368,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5305/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,018,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5306/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=1,018,752,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5307/500000] + train/ActionNoiseL2Loss=0.1292 + throughput/total_tokens=1,018,944,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5308/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,019,136,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5309/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,019,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5310/500000] + train/ActionNoiseL2Loss=0.1742 + throughput/total_tokens=1,019,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5311/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,019,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5312/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,019,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5313/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,020,096,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5314/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,020,288,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5315/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,020,480,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5316/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,020,672,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5317/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,020,864,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5318/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,021,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5319/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,021,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5320/500000] + optim/total_grad_norm=1.560 + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,021,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5321/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,021,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5322/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,021,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5323/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,022,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5324/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,022,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5325/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=1,022,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5326/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,022,592,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5327/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=1,022,784,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5328/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,022,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5329/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=1,023,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5330/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,023,360,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5331/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,023,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5332/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=1,023,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5333/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=1,023,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5334/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,024,128,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5335/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,024,320,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5336/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=1,024,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5337/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,024,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5338/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,024,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5339/500000] + train/ActionNoiseL2Loss=0.1055 + throughput/total_tokens=1,025,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5340/500000] + optim/total_grad_norm=1.912 + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,025,280,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5341/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,025,472,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5342/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,025,664,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5343/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,025,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5344/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,026,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5345/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,026,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5346/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,026,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5347/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,026,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5348/500000] + train/ActionNoiseL2Loss=0.0274 + throughput/total_tokens=1,026,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5349/500000] + train/ActionNoiseL2Loss=0.0247 + throughput/total_tokens=1,027,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5350/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,027,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5351/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=1,027,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5352/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=1,027,584,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5353/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,027,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5354/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,027,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5355/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,028,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5356/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=1,028,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5357/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,028,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5358/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,028,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5359/500000] + train/ActionNoiseL2Loss=0.1128 + throughput/total_tokens=1,028,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5360/500000] + optim/total_grad_norm=1.873 + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,029,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5361/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=1,029,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5362/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,029,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5363/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,029,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5364/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,029,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5365/500000] + train/ActionNoiseL2Loss=0.1176 + throughput/total_tokens=1,030,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5366/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,030,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5367/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,030,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5368/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,030,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5369/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,030,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5370/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,031,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5371/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,031,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5372/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,031,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5373/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,031,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5374/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,031,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5375/500000] + train/ActionNoiseL2Loss=0.1058 + throughput/total_tokens=1,032,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5376/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,032,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5377/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=1,032,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5378/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,032,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5379/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,032,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5380/500000] + optim/total_grad_norm=1.986 + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=1,032,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5381/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,033,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5382/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,033,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5383/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,033,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5384/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,033,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5385/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,033,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5386/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=1,034,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5387/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,034,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5388/500000] + train/ActionNoiseL2Loss=0.1576 + throughput/total_tokens=1,034,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5389/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=1,034,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5390/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=1,034,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5391/500000] + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=1,035,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5392/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,035,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5393/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,035,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5394/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,035,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5395/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,035,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5396/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=1,036,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5397/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=1,036,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5398/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,036,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5399/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,036,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5400/500000] + optim/total_grad_norm=1.451 + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,036,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5401/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,036,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5402/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,037,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5403/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,037,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5404/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,037,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5405/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,037,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5406/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,037,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5407/500000] + train/ActionNoiseL2Loss=0.1646 + throughput/total_tokens=1,038,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5408/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,038,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5409/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=1,038,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5410/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,038,720,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5411/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,038,912,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5412/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,039,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5413/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,039,296,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5414/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,039,488,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5415/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,039,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5416/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,039,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5417/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,040,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5418/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,040,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5419/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,040,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5420/500000] + optim/total_grad_norm=1.545 + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=1,040,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5421/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=1,040,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5422/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,041,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5423/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,041,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5424/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,041,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5425/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=1,041,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5426/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,041,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5427/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,041,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5428/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,042,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5429/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,042,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5430/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,042,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5431/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,042,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5432/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,042,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5433/500000] + train/ActionNoiseL2Loss=0.0295 + throughput/total_tokens=1,043,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5434/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,043,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5435/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,043,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5436/500000] + train/ActionNoiseL2Loss=0.1153 + throughput/total_tokens=1,043,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5437/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=1,043,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5438/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,044,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5439/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,044,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5440/500000] + optim/total_grad_norm=1.272 + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,044,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5441/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,044,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5442/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=1,044,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5443/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,045,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5444/500000] + train/ActionNoiseL2Loss=0.1374 + throughput/total_tokens=1,045,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5445/500000] + train/ActionNoiseL2Loss=0.1106 + throughput/total_tokens=1,045,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5446/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,045,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5447/500000] + train/ActionNoiseL2Loss=0.1115 + throughput/total_tokens=1,045,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5448/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,046,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5449/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,046,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5450/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,046,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5451/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,046,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5452/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,046,784,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5453/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=1,046,976,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5454/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,047,168,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5455/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,047,360,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5456/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,047,552,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5457/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,047,744,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5458/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,047,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5459/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,048,128,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5460/500000] + optim/total_grad_norm=1.357 + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,048,320,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5461/500000] + train/ActionNoiseL2Loss=0.1414 + throughput/total_tokens=1,048,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5462/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,048,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5463/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,048,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5464/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=1,049,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5465/500000] + train/ActionNoiseL2Loss=0.0261 + throughput/total_tokens=1,049,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5466/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,049,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5467/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,049,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5468/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=1,049,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5469/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,050,048,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5470/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,050,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5471/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,050,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5472/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,050,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5473/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,050,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5474/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,051,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5475/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,051,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5476/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,051,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5477/500000] + train/ActionNoiseL2Loss=0.0266 + throughput/total_tokens=1,051,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5478/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,051,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5479/500000] + train/ActionNoiseL2Loss=0.1090 + throughput/total_tokens=1,051,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5480/500000] + optim/total_grad_norm=2.145 + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,052,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5481/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,052,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5482/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,052,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5483/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=1,052,736,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5484/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=1,052,928,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5485/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,053,120,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5486/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=1,053,312,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5487/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,053,504,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5488/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,053,696,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5489/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,053,888,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5490/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,054,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=5491/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,054,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5492/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,054,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5493/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=1,054,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5494/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,054,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5495/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,055,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5496/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=1,055,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5497/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,055,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5498/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,055,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5499/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,055,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5500/500000] + optim/total_grad_norm=1.459 + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,056,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/07 [01:17:45] INFO | >> Saving config... checkpoint.py:608 +10/07 [01:18:19] INFO | >> Saving model state... checkpoint.py:796 +10/07 [01:19:33] INFO | >> Saving optim state... checkpoint.py:811 +10/07 [01:21:07] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=5501/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,056,192,000 + throughput/device/tokens_per_second=1,197 + throughput/device/batches_per_second=0.0499 +[step=5502/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=1,056,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5503/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=1,056,576,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=5504/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,056,768,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=5505/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=1,056,960,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=5506/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,057,152,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=5507/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,057,344,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=5508/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,057,536,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5509/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,057,728,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5510/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,057,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=5511/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,058,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5512/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,058,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5513/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,058,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5514/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,058,688,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5515/500000] + train/ActionNoiseL2Loss=0.1436 + throughput/total_tokens=1,058,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5516/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,059,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5517/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=1,059,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5518/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=1,059,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5519/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,059,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5520/500000] + optim/total_grad_norm=1.279 + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,059,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5521/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,060,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5522/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=1,060,224,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5523/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,060,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5524/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,060,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5525/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,060,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5526/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,060,992,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5527/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,061,184,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5528/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,061,376,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5529/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,061,568,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5530/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,061,760,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5531/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,061,952,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5532/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,062,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5533/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,062,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5534/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,062,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5535/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,062,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5536/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,062,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5537/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,063,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5538/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,063,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5539/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,063,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5540/500000] + optim/total_grad_norm=1.902 + train/ActionNoiseL2Loss=0.1325 + throughput/total_tokens=1,063,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5541/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,063,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5542/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,064,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5543/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,064,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5544/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,064,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5545/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=1,064,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5546/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=1,064,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5547/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,065,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5548/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,065,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5549/500000] + train/ActionNoiseL2Loss=0.1208 + throughput/total_tokens=1,065,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5550/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=1,065,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5551/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,065,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5552/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,065,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5553/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,066,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5554/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,066,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5555/500000] + train/ActionNoiseL2Loss=0.1438 + throughput/total_tokens=1,066,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5556/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,066,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5557/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=1,066,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5558/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,067,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5559/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,067,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5560/500000] + optim/total_grad_norm=1.999 + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,067,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5561/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,067,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5562/500000] + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=1,067,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5563/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,068,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5564/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,068,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5565/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,068,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5566/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,068,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5567/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=1,068,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5568/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,069,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5569/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=1,069,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5570/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,069,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=5571/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=1,069,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5572/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,069,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5573/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,070,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5574/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=1,070,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5575/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,070,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5576/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,070,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5577/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=1,070,784,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5578/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=1,070,976,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5579/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,071,168,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5580/500000] + optim/total_grad_norm=1.198 + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,071,360,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=5581/500000] + train/ActionNoiseL2Loss=0.1127 + throughput/total_tokens=1,071,552,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5582/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,071,744,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5583/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=1,071,936,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5584/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,072,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5585/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,072,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5586/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,072,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5587/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,072,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5588/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=1,072,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5589/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,073,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5590/500000] + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=1,073,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5591/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,073,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5592/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=1,073,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5593/500000] + train/ActionNoiseL2Loss=0.1175 + throughput/total_tokens=1,073,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5594/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=1,074,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5595/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,074,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5596/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,074,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5597/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,074,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5598/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,074,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5599/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,075,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5600/500000] + optim/total_grad_norm=1.864 + train/ActionNoiseL2Loss=0.1125 + throughput/total_tokens=1,075,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5601/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,075,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5602/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,075,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5603/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,075,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5604/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=1,075,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5605/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,076,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5606/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,076,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5607/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,076,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5608/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,076,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5609/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,076,928,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5610/500000] + train/ActionNoiseL2Loss=0.1842 + throughput/total_tokens=1,077,120,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=5611/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,077,312,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5612/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=1,077,504,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5613/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,077,696,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5614/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,077,888,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5615/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=1,078,080,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5616/500000] + train/ActionNoiseL2Loss=0.1202 + throughput/total_tokens=1,078,272,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5617/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,078,464,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5618/500000] + train/ActionNoiseL2Loss=0.0288 + throughput/total_tokens=1,078,656,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5619/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=1,078,848,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5620/500000] + optim/total_grad_norm=1.532 + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,079,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5621/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,079,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5622/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,079,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5623/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,079,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5624/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,079,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5625/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,080,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5626/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,080,192,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5627/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=1,080,384,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5628/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,080,576,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5629/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,080,768,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5630/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,080,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=5631/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,081,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5632/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,081,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5633/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,081,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5634/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,081,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5635/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,081,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5636/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,082,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5637/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,082,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5638/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,082,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5639/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,082,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5640/500000] + optim/total_grad_norm=1.579 + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,082,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=5641/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,083,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5642/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,083,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5643/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=1,083,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5644/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,083,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5645/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,083,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5646/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,084,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5647/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,084,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5648/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,084,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5649/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,084,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5650/500000] + train/ActionNoiseL2Loss=0.1355 + throughput/total_tokens=1,084,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5651/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,084,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5652/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,085,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5653/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,085,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5654/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,085,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5655/500000] + train/ActionNoiseL2Loss=0.1467 + throughput/total_tokens=1,085,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5656/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,085,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5657/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,086,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5658/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,086,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5659/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=1,086,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5660/500000] + optim/total_grad_norm=2.080 + train/ActionNoiseL2Loss=0.1146 + throughput/total_tokens=1,086,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5661/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,086,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5662/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,087,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5663/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,087,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5664/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,087,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5665/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,087,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5666/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=1,087,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5667/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,088,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5668/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,088,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5669/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,088,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5670/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,088,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5671/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,088,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5672/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,089,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5673/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,089,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5674/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=1,089,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5675/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,089,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5676/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=1,089,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5677/500000] + train/ActionNoiseL2Loss=0.1172 + throughput/total_tokens=1,089,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5678/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,090,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5679/500000] + train/ActionNoiseL2Loss=0.1227 + throughput/total_tokens=1,090,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5680/500000] + optim/total_grad_norm=1.690 + train/ActionNoiseL2Loss=0.0996 + throughput/total_tokens=1,090,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5681/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,090,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5682/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,090,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5683/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,091,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5684/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,091,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5685/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,091,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5686/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,091,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5687/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,091,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5688/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=1,092,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5689/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,092,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5690/500000] + train/ActionNoiseL2Loss=0.1105 + throughput/total_tokens=1,092,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5691/500000] + train/ActionNoiseL2Loss=0.0265 + throughput/total_tokens=1,092,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5692/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,092,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5693/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,093,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5694/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,093,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5695/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,093,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5696/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=1,093,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5697/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=1,093,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5698/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,094,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5699/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,094,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5700/500000] + optim/total_grad_norm=1.443 + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=1,094,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5701/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,094,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5702/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,094,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5703/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=1,094,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5704/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,095,168,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5705/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,095,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5706/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,095,552,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5707/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,095,744,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5708/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,095,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5709/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,096,128,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5710/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,096,320,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5711/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,096,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5712/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=1,096,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5713/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,096,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5714/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=1,097,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5715/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,097,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5716/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,097,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5717/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,097,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5718/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=1,097,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5719/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,098,048,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5720/500000] + optim/total_grad_norm=2.017 + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,098,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5721/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,098,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5722/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,098,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5723/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,098,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5724/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,099,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5725/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,099,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5726/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,099,392,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5727/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,099,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5728/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,099,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5729/500000] + train/ActionNoiseL2Loss=0.1037 + throughput/total_tokens=1,099,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5730/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=1,100,160,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5731/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,100,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5732/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,100,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5733/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,100,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5734/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,100,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5735/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,101,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5736/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,101,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5737/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,101,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5738/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,101,696,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5739/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=1,101,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5740/500000] + optim/total_grad_norm=1.180 + train/ActionNoiseL2Loss=0.0254 + throughput/total_tokens=1,102,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5741/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,102,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5742/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=1,102,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5743/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,102,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5744/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,102,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5745/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=1,103,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5746/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,103,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5747/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,103,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5748/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,103,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5749/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,103,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5750/500000] + train/ActionNoiseL2Loss=0.0299 + throughput/total_tokens=1,104,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5751/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,104,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5752/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,104,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5753/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,104,576,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5754/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,104,768,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5755/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,104,960,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5756/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=1,105,152,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5757/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=1,105,344,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5758/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,105,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5759/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,105,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5760/500000] + optim/total_grad_norm=1.624 + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,105,920,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5761/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,106,112,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5762/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,106,304,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5763/500000] + train/ActionNoiseL2Loss=0.1070 + throughput/total_tokens=1,106,496,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5764/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,106,688,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5765/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,106,880,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5766/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,107,072,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5767/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,107,264,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5768/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=1,107,456,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5769/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,107,648,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5770/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,107,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5771/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,108,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5772/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=1,108,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5773/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=1,108,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5774/500000] + train/ActionNoiseL2Loss=0.1708 + throughput/total_tokens=1,108,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5775/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,108,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5776/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,108,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5777/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,109,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5778/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,109,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5779/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,109,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5780/500000] + optim/total_grad_norm=2.017 + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,109,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5781/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,109,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5782/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,110,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5783/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=1,110,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5784/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=1,110,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5785/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,110,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5786/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,110,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5787/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=1,111,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5788/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,111,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5789/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,111,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5790/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=1,111,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5791/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,111,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5792/500000] + train/ActionNoiseL2Loss=0.1115 + throughput/total_tokens=1,112,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5793/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,112,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5794/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,112,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5795/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=1,112,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5796/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,112,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5797/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,113,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5798/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,113,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5799/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,113,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5800/500000] + optim/total_grad_norm=1.326 + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=1,113,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5801/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,113,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5802/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,113,984,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5803/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,114,176,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5804/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,114,368,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5805/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,114,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5806/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,114,752,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5807/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=1,114,944,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5808/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,115,136,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5809/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,115,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5810/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,115,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=5811/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,115,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5812/500000] + train/ActionNoiseL2Loss=0.0250 + throughput/total_tokens=1,115,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5813/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,116,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5814/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,116,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5815/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,116,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5816/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,116,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5817/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,116,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5818/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,117,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5819/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=1,117,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5820/500000] + optim/total_grad_norm=2.395 + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=1,117,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5821/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,117,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5822/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=1,117,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5823/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,118,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5824/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,118,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5825/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,118,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5826/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=1,118,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5827/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,118,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5828/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=1,118,976,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5829/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,119,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5830/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,119,360,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5831/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,119,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5832/500000] + train/ActionNoiseL2Loss=0.1567 + throughput/total_tokens=1,119,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5833/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,119,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5834/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,120,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5835/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,120,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5836/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=1,120,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5837/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,120,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5838/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,120,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5839/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,121,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5840/500000] + optim/total_grad_norm=1.102 + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,121,280,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5841/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=1,121,472,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5842/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,121,664,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5843/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,121,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5844/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,122,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5845/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,122,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5846/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,122,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5847/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,122,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5848/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,122,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5849/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=1,123,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5850/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,123,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5851/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,123,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5852/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,123,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5853/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,123,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5854/500000] + train/ActionNoiseL2Loss=0.1138 + throughput/total_tokens=1,123,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5855/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,124,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5856/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,124,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5857/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,124,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5858/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,124,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5859/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,124,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5860/500000] + optim/total_grad_norm=1.450 + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,125,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5861/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,125,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5862/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,125,504,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5863/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=1,125,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5864/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,125,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5865/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,126,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5866/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,126,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5867/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,126,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5868/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,126,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5869/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=1,126,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5870/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,127,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5871/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,127,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5872/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,127,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5873/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=1,127,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5874/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,127,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5875/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,128,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5876/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,128,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5877/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,128,384,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5878/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,128,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5879/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,128,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5880/500000] + optim/total_grad_norm=1.378 + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=1,128,960,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5881/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=1,129,152,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5882/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,129,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5883/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=1,129,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5884/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=1,129,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5885/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,129,920,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5886/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,130,112,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5887/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,130,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5888/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,130,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5889/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,130,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5890/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,130,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=5891/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,131,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5892/500000] + train/ActionNoiseL2Loss=0.1179 + throughput/total_tokens=1,131,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5893/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=1,131,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5894/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,131,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5895/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,131,840,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5896/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,132,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5897/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,132,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5898/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,132,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5899/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,132,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5900/500000] + optim/total_grad_norm=1.638 + train/ActionNoiseL2Loss=0.1114 + throughput/total_tokens=1,132,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5901/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,132,992,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5902/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,133,184,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5903/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=1,133,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5904/500000] + train/ActionNoiseL2Loss=0.1346 + throughput/total_tokens=1,133,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5905/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,133,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5906/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,133,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5907/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,134,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5908/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,134,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5909/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,134,528,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5910/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,134,720,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=5911/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,134,912,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5912/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,135,104,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5913/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,135,296,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5914/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,135,488,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5915/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=1,135,680,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5916/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,135,872,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5917/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,136,064,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5918/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,136,256,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5919/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=1,136,448,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=5920/500000] + optim/total_grad_norm=1.360 + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,136,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5921/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,136,832,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5922/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,137,024,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5923/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,137,216,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5924/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,137,408,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5925/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,137,600,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5926/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,137,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5927/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,137,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5928/500000] + train/ActionNoiseL2Loss=0.0214 + throughput/total_tokens=1,138,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5929/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,138,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5930/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,138,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5931/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,138,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5932/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,138,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5933/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,139,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5934/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,139,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5935/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,139,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5936/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=1,139,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5937/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,139,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5938/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,140,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5939/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,140,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5940/500000] + optim/total_grad_norm=1.600 + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,140,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5941/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,140,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5942/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,140,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5943/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=1,141,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5944/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,141,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5945/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,141,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5946/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=1,141,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5947/500000] + train/ActionNoiseL2Loss=0.1268 + throughput/total_tokens=1,141,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5948/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=1,142,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5949/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,142,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5950/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=1,142,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5951/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,142,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5952/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,142,784,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5953/500000] + train/ActionNoiseL2Loss=0.0249 + throughput/total_tokens=1,142,976,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5954/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,143,168,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5955/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,143,360,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5956/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,143,552,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5957/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,143,744,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5958/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,143,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5959/500000] + train/ActionNoiseL2Loss=0.1024 + throughput/total_tokens=1,144,128,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5960/500000] + optim/total_grad_norm=1.480 + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,144,320,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=5961/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,144,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5962/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,144,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5963/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,144,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5964/500000] + train/ActionNoiseL2Loss=0.0269 + throughput/total_tokens=1,145,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5965/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,145,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5966/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,145,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5967/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,145,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=5968/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,145,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5969/500000] + train/ActionNoiseL2Loss=0.0286 + throughput/total_tokens=1,146,048,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5970/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,146,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5971/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,146,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5972/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,146,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5973/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,146,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5974/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,147,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5975/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,147,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5976/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,147,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5977/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,147,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5978/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,147,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5979/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=1,147,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5980/500000] + optim/total_grad_norm=1.863 + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,148,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=5981/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=1,148,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5982/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,148,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5983/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,148,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5984/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,148,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=5985/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,149,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5986/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,149,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5987/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,149,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5988/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=1,149,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5989/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=1,149,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5990/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,150,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=5991/500000] + train/ActionNoiseL2Loss=0.1136 + throughput/total_tokens=1,150,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5992/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,150,464,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5993/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,150,656,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5994/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,150,848,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5995/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,151,040,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5996/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,151,232,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5997/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,151,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5998/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,151,616,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5999/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=1,151,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6000/500000] + optim/total_grad_norm=1.447 + train/ActionNoiseL2Loss=0.0929 + throughput/total_tokens=1,152,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +10/07 [04:15:37] INFO | >> Saving config... checkpoint.py:608 +10/07 [04:16:11] INFO | >> Saving model state... checkpoint.py:796 +10/07 [04:17:22] INFO | >> Saving optim state... checkpoint.py:811 +10/07 [04:19:01] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=6001/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,152,192,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=6002/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,152,384,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6003/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,152,576,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6004/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,152,768,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=6005/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,152,960,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6006/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,153,152,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6007/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,153,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6008/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,153,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6009/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,153,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6010/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=1,153,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6011/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,154,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6012/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,154,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6013/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=1,154,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6014/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=1,154,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6015/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,154,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6016/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,155,072,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6017/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,155,264,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6018/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=1,155,456,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6019/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,155,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6020/500000] + optim/total_grad_norm=1.303 + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=1,155,840,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6021/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,156,032,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6022/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=1,156,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6023/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=1,156,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6024/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,156,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6025/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,156,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6026/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=1,156,992,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6027/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,157,184,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6028/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,157,376,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6029/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,157,568,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6030/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,157,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6031/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,157,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6032/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,158,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6033/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,158,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6034/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,158,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6035/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,158,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6036/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,158,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6037/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,159,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6038/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,159,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6039/500000] + train/ActionNoiseL2Loss=0.1372 + throughput/total_tokens=1,159,488,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6040/500000] + optim/total_grad_norm=1.166 + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,159,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6041/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,159,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6042/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,160,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6043/500000] + train/ActionNoiseL2Loss=0.0306 + throughput/total_tokens=1,160,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6044/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=1,160,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6045/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,160,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6046/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,160,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6047/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,161,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6048/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,161,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6049/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,161,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6050/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,161,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6051/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,161,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6052/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,161,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6053/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,162,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6054/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=1,162,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6055/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,162,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6056/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,162,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6057/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,162,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6058/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,163,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6059/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,163,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6060/500000] + optim/total_grad_norm=1.507 + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,163,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6061/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,163,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6062/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,163,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6063/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,164,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6064/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,164,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6065/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,164,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6066/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,164,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6067/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,164,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6068/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,165,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6069/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,165,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6070/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=1,165,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6071/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,165,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6072/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,165,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6073/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,166,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6074/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,166,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6075/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,166,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6076/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,166,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6077/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,166,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6078/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,166,976,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6079/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=1,167,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6080/500000] + optim/total_grad_norm=2.080 + train/ActionNoiseL2Loss=0.1068 + throughput/total_tokens=1,167,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6081/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=1,167,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6082/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,167,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6083/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,167,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6084/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,168,128,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6085/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,168,320,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6086/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,168,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6087/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,168,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6088/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,168,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6089/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=1,169,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6090/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,169,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6091/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,169,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6092/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,169,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6093/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,169,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6094/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,170,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6095/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=1,170,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6096/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,170,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6097/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,170,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6098/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,170,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6099/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,171,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6100/500000] + optim/total_grad_norm=1.137 + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,171,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6101/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,171,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6102/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,171,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6103/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,171,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6104/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,171,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6105/500000] + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=1,172,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6106/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,172,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6107/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,172,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6108/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=1,172,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6109/500000] + train/ActionNoiseL2Loss=0.1229 + throughput/total_tokens=1,172,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6110/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,173,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6111/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=1,173,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6112/500000] + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=1,173,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6113/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,173,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6114/500000] + train/ActionNoiseL2Loss=0.1481 + throughput/total_tokens=1,173,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6115/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,174,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6116/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,174,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6117/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,174,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6118/500000] + train/ActionNoiseL2Loss=0.1555 + throughput/total_tokens=1,174,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6119/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,174,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6120/500000] + optim/total_grad_norm=1.735 + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=1,175,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6121/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=1,175,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6122/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,175,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6123/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,175,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6124/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,175,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6125/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=1,176,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6126/500000] + train/ActionNoiseL2Loss=0.0300 + throughput/total_tokens=1,176,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6127/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=1,176,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6128/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,176,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6129/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,176,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6130/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,176,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6131/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,177,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6132/500000] + train/ActionNoiseL2Loss=0.0176 + throughput/total_tokens=1,177,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6133/500000] + train/ActionNoiseL2Loss=0.1002 + throughput/total_tokens=1,177,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6134/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,177,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6135/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=1,177,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6136/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,178,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6137/500000] + train/ActionNoiseL2Loss=0.1720 + throughput/total_tokens=1,178,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6138/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=1,178,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6139/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=1,178,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6140/500000] + optim/total_grad_norm=1.639 + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,178,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6141/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=1,179,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6142/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,179,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6143/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,179,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6144/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,179,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6145/500000] + train/ActionNoiseL2Loss=0.1242 + throughput/total_tokens=1,179,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6146/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,180,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6147/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,180,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6148/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,180,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6149/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=1,180,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6150/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,180,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6151/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=1,180,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6152/500000] + train/ActionNoiseL2Loss=0.1170 + throughput/total_tokens=1,181,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6153/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,181,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6154/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,181,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6155/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,181,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6156/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,181,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6157/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,182,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6158/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,182,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6159/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,182,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6160/500000] + optim/total_grad_norm=2.665 + train/ActionNoiseL2Loss=0.1558 + throughput/total_tokens=1,182,720,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=6161/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,182,912,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6162/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,183,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6163/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,183,296,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6164/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,183,488,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6165/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,183,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6166/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,183,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6167/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,184,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6168/500000] + train/ActionNoiseL2Loss=0.1673 + throughput/total_tokens=1,184,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6169/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,184,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6170/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=1,184,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6171/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,184,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6172/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=1,185,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6173/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,185,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6174/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,185,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6175/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,185,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6176/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=1,185,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6177/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,185,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6178/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,186,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6179/500000] + train/ActionNoiseL2Loss=0.1100 + throughput/total_tokens=1,186,368,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6180/500000] + optim/total_grad_norm=2.005 + train/ActionNoiseL2Loss=0.1545 + throughput/total_tokens=1,186,560,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6181/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=1,186,752,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6182/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,186,944,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6183/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,187,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6184/500000] + train/ActionNoiseL2Loss=0.0968 + throughput/total_tokens=1,187,328,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6185/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,187,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6186/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,187,712,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6187/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,187,904,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6188/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,188,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6189/500000] + train/ActionNoiseL2Loss=0.1353 + throughput/total_tokens=1,188,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6190/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=1,188,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6191/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,188,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6192/500000] + train/ActionNoiseL2Loss=0.0250 + throughput/total_tokens=1,188,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6193/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,189,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6194/500000] + train/ActionNoiseL2Loss=0.1408 + throughput/total_tokens=1,189,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6195/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,189,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6196/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,189,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6197/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,189,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6198/500000] + train/ActionNoiseL2Loss=0.1140 + throughput/total_tokens=1,190,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6199/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,190,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6200/500000] + optim/total_grad_norm=0.8752 + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,190,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6201/500000] + train/ActionNoiseL2Loss=0.1167 + throughput/total_tokens=1,190,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6202/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=1,190,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6203/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,190,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6204/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,191,168,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6205/500000] + train/ActionNoiseL2Loss=0.1106 + throughput/total_tokens=1,191,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6206/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,191,552,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6207/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,191,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6208/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,191,936,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6209/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,192,128,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6210/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,192,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6211/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,192,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6212/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=1,192,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6213/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,192,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6214/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,193,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6215/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,193,280,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6216/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,193,472,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6217/500000] + train/ActionNoiseL2Loss=0.1297 + throughput/total_tokens=1,193,664,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6218/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,193,856,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6219/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=1,194,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6220/500000] + optim/total_grad_norm=1.262 + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,194,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6221/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,194,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6222/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,194,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6223/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,194,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6224/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,195,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6225/500000] + train/ActionNoiseL2Loss=0.1007 + throughput/total_tokens=1,195,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6226/500000] + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=1,195,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6227/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,195,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6228/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=1,195,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6229/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,195,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6230/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=1,196,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6231/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,196,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6232/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,196,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6233/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,196,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6234/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,196,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6235/500000] + train/ActionNoiseL2Loss=0.1094 + throughput/total_tokens=1,197,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6236/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,197,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6237/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=1,197,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6238/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,197,696,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6239/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,197,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6240/500000] + optim/total_grad_norm=1.350 + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,198,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6241/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,198,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6242/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,198,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6243/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,198,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6244/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,198,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6245/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,199,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6246/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,199,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6247/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,199,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6248/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,199,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6249/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,199,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6250/500000] + train/ActionNoiseL2Loss=0.0306 + throughput/total_tokens=1,200,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6251/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,200,192,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6252/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,200,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6253/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=1,200,576,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6254/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,200,768,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6255/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,200,960,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6256/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=1,201,152,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6257/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=1,201,344,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6258/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,201,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6259/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,201,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6260/500000] + optim/total_grad_norm=1.171 + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,201,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6261/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,202,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6262/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,202,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6263/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,202,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6264/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,202,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6265/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,202,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6266/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,203,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6267/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=1,203,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6268/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=1,203,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6269/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,203,648,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6270/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,203,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6271/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=1,204,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6272/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,204,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6273/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,204,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6274/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,204,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6275/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=1,204,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6276/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,204,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6277/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,205,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6278/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,205,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6279/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,205,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6280/500000] + optim/total_grad_norm=1.190 + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,205,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6281/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,205,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6282/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,206,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6283/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,206,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6284/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,206,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6285/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,206,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6286/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,206,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6287/500000] + train/ActionNoiseL2Loss=0.1515 + throughput/total_tokens=1,207,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6288/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,207,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6289/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,207,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6290/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,207,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6291/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,207,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6292/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,208,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6293/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,208,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6294/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,208,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6295/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=1,208,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6296/500000] + train/ActionNoiseL2Loss=0.0255 + throughput/total_tokens=1,208,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6297/500000] + train/ActionNoiseL2Loss=0.1037 + throughput/total_tokens=1,209,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6298/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,209,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6299/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=1,209,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6300/500000] + optim/total_grad_norm=1.616 + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,209,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6301/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,209,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6302/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=1,209,984,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6303/500000] + train/ActionNoiseL2Loss=0.1333 + throughput/total_tokens=1,210,176,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6304/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=1,210,368,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6305/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,210,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6306/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=1,210,752,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6307/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,210,944,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6308/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=1,211,136,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6309/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,211,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6310/500000] + train/ActionNoiseL2Loss=0.1208 + throughput/total_tokens=1,211,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6311/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,211,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6312/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,211,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6313/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,212,096,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6314/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,212,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6315/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,212,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6316/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,212,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6317/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,212,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6318/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=1,213,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6319/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,213,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6320/500000] + optim/total_grad_norm=1.328 + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=1,213,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6321/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,213,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6322/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,213,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6323/500000] + train/ActionNoiseL2Loss=0.1129 + throughput/total_tokens=1,214,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6324/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=1,214,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6325/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,214,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6326/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,214,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6327/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,214,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6328/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,214,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6329/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=1,215,168,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6330/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,215,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=6331/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,215,552,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6332/500000] + train/ActionNoiseL2Loss=0.0292 + throughput/total_tokens=1,215,744,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6333/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,215,936,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6334/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,216,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6335/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,216,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6336/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,216,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6337/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,216,704,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6338/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,216,896,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6339/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,217,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6340/500000] + optim/total_grad_norm=1.859 + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=1,217,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=6341/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,217,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6342/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,217,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6343/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,217,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6344/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,218,048,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6345/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,218,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6346/500000] + train/ActionNoiseL2Loss=0.1255 + throughput/total_tokens=1,218,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6347/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,218,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6348/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,218,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6349/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,219,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6350/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,219,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6351/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,219,392,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6352/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,219,584,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6353/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,219,776,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6354/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,219,968,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6355/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,220,160,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6356/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,220,352,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6357/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=1,220,544,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6358/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,220,736,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6359/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,220,928,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6360/500000] + optim/total_grad_norm=3.087 + train/ActionNoiseL2Loss=0.1381 + throughput/total_tokens=1,221,120,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=6361/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,221,312,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6362/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,221,504,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6363/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=1,221,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6364/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,221,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6365/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=1,222,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6366/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,222,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6367/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,222,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6368/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,222,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6369/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,222,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6370/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,223,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6371/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=1,223,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6372/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,223,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6373/500000] + train/ActionNoiseL2Loss=0.1266 + throughput/total_tokens=1,223,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6374/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,223,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6375/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,224,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6376/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,224,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6377/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,224,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6378/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,224,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6379/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,224,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6380/500000] + optim/total_grad_norm=1.538 + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,224,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6381/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,225,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6382/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,225,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6383/500000] + train/ActionNoiseL2Loss=0.0917 + throughput/total_tokens=1,225,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6384/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,225,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6385/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=1,225,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6386/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,226,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6387/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,226,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6388/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=1,226,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6389/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,226,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6390/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,226,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=6391/500000] + train/ActionNoiseL2Loss=0.1083 + throughput/total_tokens=1,227,072,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6392/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,227,264,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6393/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=1,227,456,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6394/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,227,648,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6395/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,227,840,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6396/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,228,032,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6397/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,228,224,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6398/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=1,228,416,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6399/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,228,608,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6400/500000] + optim/total_grad_norm=1.676 + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,228,800,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=6401/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,228,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6402/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,229,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6403/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,229,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6404/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,229,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6405/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,229,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6406/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,229,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6407/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,230,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6408/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,230,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6409/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,230,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6410/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,230,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6411/500000] + train/ActionNoiseL2Loss=0.1012 + throughput/total_tokens=1,230,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6412/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,231,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6413/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,231,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6414/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=1,231,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6415/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,231,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6416/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,231,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6417/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=1,232,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6418/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=1,232,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6419/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,232,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6420/500000] + optim/total_grad_norm=1.366 + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,232,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6421/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,232,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6422/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,233,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6423/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,233,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6424/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,233,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6425/500000] + train/ActionNoiseL2Loss=0.0223 + throughput/total_tokens=1,233,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6426/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,233,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6427/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,233,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6428/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,234,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6429/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,234,368,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6430/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,234,560,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6431/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,234,752,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6432/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=1,234,944,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6433/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=1,235,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6434/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,235,328,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6435/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,235,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6436/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,235,712,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6437/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,235,904,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6438/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,236,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6439/500000] + train/ActionNoiseL2Loss=0.0278 + throughput/total_tokens=1,236,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6440/500000] + optim/total_grad_norm=1.384 + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,236,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6441/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,236,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6442/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,236,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6443/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,237,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6444/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=1,237,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6445/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,237,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6446/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,237,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6447/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,237,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6448/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=1,238,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6449/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,238,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6450/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=1,238,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6451/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,238,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6452/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,238,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6453/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=1,238,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6454/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,239,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6455/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,239,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6456/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,239,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6457/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,239,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6458/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,239,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6459/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,240,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6460/500000] + optim/total_grad_norm=1.498 + train/ActionNoiseL2Loss=0.1224 + throughput/total_tokens=1,240,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6461/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,240,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6462/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,240,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6463/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,240,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6464/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,241,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6465/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,241,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6466/500000] + train/ActionNoiseL2Loss=0.1315 + throughput/total_tokens=1,241,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6467/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=1,241,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6468/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,241,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6469/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=1,242,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6470/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=1,242,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=6471/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,242,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6472/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,242,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6473/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=1,242,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6474/500000] + train/ActionNoiseL2Loss=0.1401 + throughput/total_tokens=1,243,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6475/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,243,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6476/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,243,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6477/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=1,243,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6478/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,243,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6479/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,243,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6480/500000] + optim/total_grad_norm=0.8993 + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,244,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6481/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,244,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6482/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,244,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6483/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,244,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6484/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,244,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6485/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,245,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6486/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,245,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6487/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,245,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6488/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,245,696,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6489/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,245,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6490/500000] + train/ActionNoiseL2Loss=0.0258 + throughput/total_tokens=1,246,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6491/500000] + train/ActionNoiseL2Loss=0.1212 + throughput/total_tokens=1,246,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6492/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,246,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6493/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,246,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6494/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,246,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6495/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,247,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6496/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,247,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6497/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,247,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6498/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,247,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6499/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=1,247,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6500/500000] + optim/total_grad_norm=1.194 + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,248,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/07 [07:13:25] INFO | >> Saving config... checkpoint.py:608 +10/07 [07:13:59] INFO | >> Saving model state... checkpoint.py:796 +10/07 [07:15:12] INFO | >> Saving optim state... checkpoint.py:811 +10/07 [07:16:38] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=6501/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,248,192,000 + throughput/device/tokens_per_second=1,194 + throughput/device/batches_per_second=0.0498 +[step=6502/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,248,384,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6503/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,248,576,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=6504/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,248,768,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=6505/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=1,248,960,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=6506/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,249,152,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=6507/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,249,344,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=6508/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,249,536,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=6509/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,249,728,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=6510/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=1,249,920,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=6511/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,250,112,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6512/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,250,304,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6513/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=1,250,496,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6514/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,250,688,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6515/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,250,880,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6516/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,251,072,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6517/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,251,264,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6518/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,251,456,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6519/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,251,648,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=6520/500000] + optim/total_grad_norm=1.465 + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=1,251,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6521/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,252,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6522/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,252,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6523/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,252,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6524/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,252,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6525/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,252,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6526/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,252,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6527/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,253,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6528/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,253,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6529/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,253,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6530/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,253,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=6531/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,253,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6532/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,254,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6533/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=1,254,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6534/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,254,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6535/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,254,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6536/500000] + train/ActionNoiseL2Loss=0.1409 + throughput/total_tokens=1,254,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6537/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=1,255,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6538/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=1,255,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6539/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,255,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6540/500000] + optim/total_grad_norm=1.337 + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,255,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6541/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,255,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6542/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,256,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6543/500000] + train/ActionNoiseL2Loss=0.0257 + throughput/total_tokens=1,256,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6544/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,256,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6545/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,256,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6546/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,256,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6547/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,257,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6548/500000] + train/ActionNoiseL2Loss=0.0194 + throughput/total_tokens=1,257,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6549/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,257,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6550/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=1,257,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6551/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=1,257,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6552/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=1,257,984,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6553/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,258,176,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6554/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,258,368,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6555/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,258,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6556/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,258,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6557/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,258,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6558/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,259,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6559/500000] + train/ActionNoiseL2Loss=0.1151 + throughput/total_tokens=1,259,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6560/500000] + optim/total_grad_norm=2.007 + train/ActionNoiseL2Loss=0.1229 + throughput/total_tokens=1,259,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6561/500000] + train/ActionNoiseL2Loss=0.1359 + throughput/total_tokens=1,259,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6562/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,259,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6563/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,260,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6564/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,260,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6565/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,260,480,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6566/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,260,672,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6567/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,260,864,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6568/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,261,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6569/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=1,261,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6570/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=1,261,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6571/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,261,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6572/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,261,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6573/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,262,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6574/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,262,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6575/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,262,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6576/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=1,262,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6577/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,262,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6578/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,262,976,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6579/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,263,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6580/500000] + optim/total_grad_norm=1.360 + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,263,360,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6581/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=1,263,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6582/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,263,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6583/500000] + train/ActionNoiseL2Loss=0.0299 + throughput/total_tokens=1,263,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6584/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,264,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6585/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,264,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6586/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,264,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6587/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,264,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6588/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,264,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6589/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,265,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6590/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,265,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6591/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,265,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6592/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,265,664,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6593/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,265,856,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6594/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,266,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6595/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,266,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6596/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=1,266,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6597/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,266,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6598/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,266,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6599/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=1,267,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6600/500000] + optim/total_grad_norm=1.798 + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=1,267,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6601/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,267,392,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6602/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=1,267,584,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6603/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,267,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6604/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=1,267,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6605/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,268,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6606/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=1,268,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6607/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,268,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6608/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,268,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6609/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=1,268,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6610/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,269,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6611/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=1,269,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6612/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,269,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6613/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,269,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6614/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,269,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6615/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,270,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6616/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,270,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6617/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,270,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6618/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,270,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6619/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,270,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6620/500000] + optim/total_grad_norm=1.050 + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,271,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6621/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,271,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6622/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,271,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6623/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,271,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6624/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,271,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6625/500000] + train/ActionNoiseL2Loss=0.1118 + throughput/total_tokens=1,272,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6626/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=1,272,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6627/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,272,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6628/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,272,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6629/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,272,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6630/500000] + train/ActionNoiseL2Loss=0.0300 + throughput/total_tokens=1,272,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6631/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,273,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6632/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,273,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6633/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,273,536,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6634/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,273,728,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6635/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,273,920,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6636/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,274,112,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6637/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,274,304,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6638/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=1,274,496,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6639/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=1,274,688,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6640/500000] + optim/total_grad_norm=1.297 + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,274,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6641/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=1,275,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6642/500000] + train/ActionNoiseL2Loss=0.0207 + throughput/total_tokens=1,275,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6643/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,275,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6644/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,275,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6645/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,275,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6646/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,276,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6647/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,276,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6648/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,276,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6649/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=1,276,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6650/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=1,276,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6651/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=1,276,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6652/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,277,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6653/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,277,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6654/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,277,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6655/500000] + train/ActionNoiseL2Loss=0.0198 + throughput/total_tokens=1,277,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6656/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,277,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6657/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,278,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6658/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,278,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6659/500000] + train/ActionNoiseL2Loss=0.1179 + throughput/total_tokens=1,278,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6660/500000] + optim/total_grad_norm=1.290 + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,278,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6661/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=1,278,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6662/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,279,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6663/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,279,296,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6664/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,279,488,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6665/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,279,680,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6666/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,279,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6667/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,280,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6668/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=1,280,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6669/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,280,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6670/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,280,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6671/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,280,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6672/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=1,281,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6673/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,281,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6674/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,281,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6675/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,281,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6676/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,281,792,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6677/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=1,281,984,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6678/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,282,176,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6679/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,282,368,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6680/500000] + optim/total_grad_norm=1.790 + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,282,560,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6681/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,282,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6682/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=1,282,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6683/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,283,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6684/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,283,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6685/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,283,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6686/500000] + train/ActionNoiseL2Loss=0.1116 + throughput/total_tokens=1,283,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6687/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,283,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6688/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,284,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6689/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,284,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6690/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,284,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6691/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,284,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6692/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=1,284,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6693/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,285,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6694/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,285,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6695/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,285,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6696/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,285,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6697/500000] + train/ActionNoiseL2Loss=0.1400 + throughput/total_tokens=1,285,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6698/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,286,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6699/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,286,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6700/500000] + optim/total_grad_norm=2.355 + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=1,286,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6701/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,286,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6702/500000] + train/ActionNoiseL2Loss=0.1175 + throughput/total_tokens=1,286,784,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6703/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,286,976,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6704/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,287,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6705/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=1,287,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6706/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,287,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6707/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,287,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6708/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=1,287,936,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6709/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,288,128,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6710/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,288,320,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=6711/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,288,512,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6712/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,288,704,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6713/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=1,288,896,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6714/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,289,088,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6715/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,289,280,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6716/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=1,289,472,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6717/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,289,664,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6718/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,289,856,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6719/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,290,048,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=6720/500000] + optim/total_grad_norm=1.303 + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,290,240,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6721/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,290,432,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6722/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=1,290,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6723/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,290,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6724/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=1,291,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6725/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=1,291,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6726/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,291,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6727/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,291,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6728/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,291,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6729/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,291,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6730/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=1,292,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6731/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,292,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6732/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,292,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6733/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,292,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6734/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,292,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6735/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,293,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6736/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,293,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6737/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=1,293,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6738/500000] + train/ActionNoiseL2Loss=0.0149 + throughput/total_tokens=1,293,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6739/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,293,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6740/500000] + optim/total_grad_norm=1.025 + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,294,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=6741/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,294,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6742/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,294,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=6743/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,294,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6744/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=1,294,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6745/500000] + train/ActionNoiseL2Loss=0.1668 + throughput/total_tokens=1,295,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6746/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,295,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6747/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=1,295,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6748/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,295,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6749/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=1,295,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6750/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,296,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6751/500000] + train/ActionNoiseL2Loss=0.1374 + throughput/total_tokens=1,296,192,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6752/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,296,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6753/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,296,576,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6754/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,296,768,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6755/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,296,960,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6756/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,297,152,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6757/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,297,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6758/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,297,536,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=6759/500000] + train/ActionNoiseL2Loss=0.1247 + throughput/total_tokens=1,297,728,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6760/500000] + optim/total_grad_norm=1.625 + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,297,920,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=6761/500000] + train/ActionNoiseL2Loss=0.2227 + throughput/total_tokens=1,298,112,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6762/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=1,298,304,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6763/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,298,496,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6764/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=1,298,688,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6765/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=1,298,880,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6766/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,299,072,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6767/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,299,264,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6768/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,299,456,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6769/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,299,648,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6770/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,299,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6771/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,300,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6772/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,300,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6773/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,300,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6774/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,300,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6775/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,300,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6776/500000] + train/ActionNoiseL2Loss=0.0279 + throughput/total_tokens=1,300,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6777/500000] + train/ActionNoiseL2Loss=0.1182 + throughput/total_tokens=1,301,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6778/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,301,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6779/500000] + train/ActionNoiseL2Loss=0.1638 + throughput/total_tokens=1,301,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6780/500000] + optim/total_grad_norm=1.542 + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,301,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6781/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,301,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6782/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=1,302,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6783/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,302,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6784/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,302,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6785/500000] + train/ActionNoiseL2Loss=0.1855 + throughput/total_tokens=1,302,720,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6786/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=1,302,912,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6787/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=1,303,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6788/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,303,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6789/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,303,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6790/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,303,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6791/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=1,303,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6792/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,304,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6793/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,304,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6794/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,304,448,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6795/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,304,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6796/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,304,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6797/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=1,305,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6798/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,305,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6799/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,305,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6800/500000] + optim/total_grad_norm=1.434 + train/ActionNoiseL2Loss=0.1123 + throughput/total_tokens=1,305,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6801/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,305,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6802/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,305,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6803/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,306,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6804/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,306,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6805/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,306,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6806/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=1,306,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6807/500000] + train/ActionNoiseL2Loss=0.1166 + throughput/total_tokens=1,306,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6808/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=1,307,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6809/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=1,307,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6810/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,307,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6811/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,307,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6812/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,307,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6813/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=1,308,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6814/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,308,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6815/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=1,308,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6816/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,308,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6817/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,308,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6818/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,309,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6819/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,309,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6820/500000] + optim/total_grad_norm=1.695 + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,309,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6821/500000] + train/ActionNoiseL2Loss=0.1431 + throughput/total_tokens=1,309,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6822/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,309,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6823/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,310,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6824/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,310,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6825/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=1,310,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6826/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,310,592,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6827/500000] + train/ActionNoiseL2Loss=0.0298 + throughput/total_tokens=1,310,784,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6828/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,310,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6829/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=1,311,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6830/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=1,311,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6831/500000] + train/ActionNoiseL2Loss=0.1399 + throughput/total_tokens=1,311,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6832/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=1,311,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6833/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,311,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6834/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,312,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6835/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,312,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6836/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,312,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6837/500000] + train/ActionNoiseL2Loss=0.1381 + throughput/total_tokens=1,312,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6838/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,312,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6839/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=1,313,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6840/500000] + optim/total_grad_norm=1.331 + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,313,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6841/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,313,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6842/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,313,664,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6843/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,313,856,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6844/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,314,048,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6845/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,314,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6846/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,314,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6847/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=1,314,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6848/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,314,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6849/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,315,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=6850/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,315,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6851/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,315,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6852/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=1,315,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6853/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,315,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=6854/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,315,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6855/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,316,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6856/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,316,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6857/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=1,316,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6858/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,316,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6859/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,316,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6860/500000] + optim/total_grad_norm=1.329 + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,317,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=6861/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,317,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6862/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,317,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6863/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,317,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6864/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=1,317,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6865/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=1,318,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6866/500000] + train/ActionNoiseL2Loss=0.1373 + throughput/total_tokens=1,318,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6867/500000] + train/ActionNoiseL2Loss=0.0226 + throughput/total_tokens=1,318,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6868/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,318,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6869/500000] + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=1,318,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=6870/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,319,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6871/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,319,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6872/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,319,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6873/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=1,319,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6874/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,319,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6875/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=1,320,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6876/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,320,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6877/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,320,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6878/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,320,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6879/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,320,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6880/500000] + optim/total_grad_norm=1.045 + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,320,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6881/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,321,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6882/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,321,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6883/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,321,536,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6884/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,321,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6885/500000] + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=1,321,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6886/500000] + train/ActionNoiseL2Loss=0.1177 + throughput/total_tokens=1,322,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6887/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=1,322,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6888/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,322,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6889/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=1,322,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6890/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,322,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6891/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,323,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6892/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,323,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6893/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,323,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6894/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,323,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6895/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,323,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6896/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,324,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6897/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,324,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6898/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,324,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6899/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,324,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6900/500000] + optim/total_grad_norm=1.712 + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,324,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6901/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=1,324,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6902/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=1,325,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6903/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,325,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6904/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,325,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6905/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,325,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6906/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=1,325,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6907/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,326,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6908/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,326,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6909/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,326,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=6910/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,326,720,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=6911/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,326,912,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6912/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=1,327,104,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6913/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,327,296,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6914/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,327,488,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6915/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,327,680,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6916/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=1,327,872,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6917/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=1,328,064,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6918/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,328,256,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6919/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,328,448,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6920/500000] + optim/total_grad_norm=1.889 + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,328,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6921/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,328,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6922/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,329,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6923/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,329,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6924/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,329,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6925/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,329,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6926/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,329,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6927/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=1,329,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6928/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,330,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6929/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,330,368,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6930/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,330,560,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6931/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=1,330,752,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6932/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,330,944,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6933/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,331,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6934/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,331,328,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6935/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,331,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6936/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=1,331,712,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6937/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,331,904,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6938/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,332,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6939/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,332,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6940/500000] + optim/total_grad_norm=1.224 + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,332,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6941/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,332,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6942/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,332,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6943/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,333,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6944/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,333,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6945/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,333,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6946/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,333,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6947/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=1,333,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6948/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,334,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6949/500000] + train/ActionNoiseL2Loss=0.1141 + throughput/total_tokens=1,334,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6950/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,334,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6951/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,334,592,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6952/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,334,784,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6953/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,334,976,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6954/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,335,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6955/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,335,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6956/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,335,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6957/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,335,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6958/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,335,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6959/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,336,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6960/500000] + optim/total_grad_norm=1.083 + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,336,320,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=6961/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,336,512,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6962/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,336,704,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6963/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,336,896,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6964/500000] + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=1,337,088,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6965/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,337,280,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6966/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,337,472,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6967/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,337,664,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6968/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,337,856,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6969/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,338,048,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=6970/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=1,338,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6971/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,338,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6972/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,338,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6973/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,338,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6974/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,339,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6975/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,339,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6976/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,339,392,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6977/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,339,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6978/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,339,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6979/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=1,339,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6980/500000] + optim/total_grad_norm=2.083 + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=1,340,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6981/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,340,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6982/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,340,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6983/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,340,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6984/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,340,928,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6985/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=1,341,120,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6986/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,341,312,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6987/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,341,504,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6988/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,341,696,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=6989/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,341,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6990/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,342,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=6991/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,342,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6992/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,342,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6993/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=1,342,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6994/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,342,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6995/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=1,343,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6996/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=1,343,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6997/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=1,343,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6998/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,343,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=6999/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=1,343,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7000/500000] + optim/total_grad_norm=1.136 + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,344,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/07 [10:11:03] INFO | >> Saving config... checkpoint.py:608 +10/07 [10:11:38] INFO | >> Saving model state... checkpoint.py:796 +10/07 [10:12:52] INFO | >> Saving optim state... checkpoint.py:811 +10/07 [10:14:25] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=7001/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=1,344,192,000 + throughput/device/tokens_per_second=1,192 + throughput/device/batches_per_second=0.0497 +[step=7002/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,344,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7003/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,344,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7004/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=1,344,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7005/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,344,960,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7006/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,345,152,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7007/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=1,345,344,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=7008/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=1,345,536,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7009/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,345,728,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7010/500000] + train/ActionNoiseL2Loss=0.1299 + throughput/total_tokens=1,345,920,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=7011/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=1,346,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7012/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,346,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7013/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,346,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7014/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,346,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7015/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=1,346,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7016/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,347,072,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7017/500000] + train/ActionNoiseL2Loss=0.1133 + throughput/total_tokens=1,347,264,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7018/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,347,456,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7019/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,347,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7020/500000] + optim/total_grad_norm=2.323 + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=1,347,840,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7021/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,348,032,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7022/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=1,348,224,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7023/500000] + train/ActionNoiseL2Loss=0.1664 + throughput/total_tokens=1,348,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7024/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,348,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7025/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,348,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7026/500000] + train/ActionNoiseL2Loss=0.1121 + throughput/total_tokens=1,348,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7027/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,349,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7028/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,349,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7029/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,349,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7030/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,349,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7031/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,349,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7032/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,350,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7033/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,350,336,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7034/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=1,350,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7035/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=1,350,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7036/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,350,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7037/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,351,104,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7038/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,351,296,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7039/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,351,488,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7040/500000] + optim/total_grad_norm=1.832 + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=1,351,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7041/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,351,872,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7042/500000] + train/ActionNoiseL2Loss=0.1503 + throughput/total_tokens=1,352,064,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7043/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,352,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7044/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=1,352,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7045/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,352,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7046/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,352,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7047/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,353,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7048/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,353,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7049/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=1,353,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7050/500000] + train/ActionNoiseL2Loss=0.0971 + throughput/total_tokens=1,353,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7051/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,353,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7052/500000] + train/ActionNoiseL2Loss=0.1119 + throughput/total_tokens=1,353,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7053/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,354,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7054/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,354,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7055/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,354,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7056/500000] + train/ActionNoiseL2Loss=0.0929 + throughput/total_tokens=1,354,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7057/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,354,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7058/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,355,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7059/500000] + train/ActionNoiseL2Loss=0.0288 + throughput/total_tokens=1,355,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7060/500000] + optim/total_grad_norm=1.091 + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,355,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7061/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,355,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7062/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,355,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7063/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,356,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7064/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,356,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7065/500000] + train/ActionNoiseL2Loss=0.0194 + throughput/total_tokens=1,356,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7066/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,356,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7067/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,356,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7068/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=1,357,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7069/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,357,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7070/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,357,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7071/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,357,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7072/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,357,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7073/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,358,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7074/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,358,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7075/500000] + train/ActionNoiseL2Loss=0.0247 + throughput/total_tokens=1,358,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7076/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,358,592,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7077/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,358,784,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7078/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,358,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7079/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=1,359,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7080/500000] + optim/total_grad_norm=1.450 + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,359,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7081/500000] + train/ActionNoiseL2Loss=0.1536 + throughput/total_tokens=1,359,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7082/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,359,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7083/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=1,359,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7084/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,360,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7085/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,360,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7086/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,360,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7087/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,360,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7088/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,360,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7089/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,361,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7090/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,361,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7091/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,361,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7092/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,361,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7093/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,361,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7094/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,362,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7095/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,362,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7096/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,362,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7097/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,362,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7098/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,362,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7099/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,363,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7100/500000] + optim/total_grad_norm=1.013 + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=1,363,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7101/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,363,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7102/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,363,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7103/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,363,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7104/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,363,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7105/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,364,160,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7106/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,364,352,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7107/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,364,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7108/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,364,736,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7109/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,364,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7110/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,365,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7111/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,365,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7112/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,365,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7113/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,365,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7114/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,365,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7115/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=1,366,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7116/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,366,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7117/500000] + train/ActionNoiseL2Loss=0.0279 + throughput/total_tokens=1,366,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7118/500000] + train/ActionNoiseL2Loss=0.0242 + throughput/total_tokens=1,366,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7119/500000] + train/ActionNoiseL2Loss=0.0246 + throughput/total_tokens=1,366,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7120/500000] + optim/total_grad_norm=1.676 + train/ActionNoiseL2Loss=0.1018 + throughput/total_tokens=1,367,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7121/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=1,367,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7122/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,367,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7123/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,367,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7124/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,367,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7125/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,368,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7126/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,368,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7127/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,368,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7128/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,368,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7129/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,368,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7130/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,368,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7131/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=1,369,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7132/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,369,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7133/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=1,369,536,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7134/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,369,728,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7135/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,369,920,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7136/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,370,112,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7137/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,370,304,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7138/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,370,496,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7139/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,370,688,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7140/500000] + optim/total_grad_norm=1.728 + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,370,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7141/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,371,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7142/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,371,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7143/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=1,371,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7144/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=1,371,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7145/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,371,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7146/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=1,372,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7147/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,372,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7148/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,372,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7149/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,372,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7150/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,372,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7151/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,372,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7152/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=1,373,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7153/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=1,373,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7154/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,373,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7155/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,373,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7156/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,373,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7157/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=1,374,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7158/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,374,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7159/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,374,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7160/500000] + optim/total_grad_norm=1.395 + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=1,374,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7161/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,374,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7162/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,375,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7163/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,375,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7164/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,375,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7165/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,375,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7166/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,375,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7167/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,376,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7168/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,376,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7169/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=1,376,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7170/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,376,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7171/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,376,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7172/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=1,377,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7173/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,377,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7174/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,377,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7175/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=1,377,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7176/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,377,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7177/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,377,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7178/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=1,378,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7179/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,378,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7180/500000] + optim/total_grad_norm=1.139 + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,378,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7181/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,378,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7182/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,378,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7183/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,379,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7184/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,379,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7185/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,379,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7186/500000] + train/ActionNoiseL2Loss=0.1593 + throughput/total_tokens=1,379,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7187/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,379,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7188/500000] + train/ActionNoiseL2Loss=0.1207 + throughput/total_tokens=1,380,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7189/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,380,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7190/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=1,380,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7191/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,380,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7192/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,380,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7193/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,381,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7194/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,381,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7195/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,381,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7196/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,381,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7197/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,381,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7198/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=1,382,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7199/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,382,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7200/500000] + optim/total_grad_norm=1.797 + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=1,382,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7201/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=1,382,592,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7202/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,382,784,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7203/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,382,976,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7204/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,383,168,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7205/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,383,360,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7206/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,383,552,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7207/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,383,744,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7208/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,383,936,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7209/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,384,128,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7210/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,384,320,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=7211/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=1,384,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7212/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,384,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7213/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,384,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7214/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,385,088,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7215/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,385,280,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7216/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,385,472,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7217/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=1,385,664,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7218/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,385,856,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7219/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,386,048,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7220/500000] + optim/total_grad_norm=1.862 + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=1,386,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7221/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,386,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7222/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,386,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7223/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,386,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7224/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,387,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7225/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,387,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7226/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,387,392,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7227/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=1,387,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7228/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,387,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7229/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,387,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7230/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,388,160,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7231/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,388,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7232/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,388,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7233/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=1,388,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7234/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=1,388,928,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7235/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,389,120,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7236/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,389,312,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7237/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,389,504,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7238/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,389,696,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7239/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,389,888,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7240/500000] + optim/total_grad_norm=1.327 + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,390,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7241/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,390,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7242/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,390,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7243/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,390,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7244/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,390,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7245/500000] + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=1,391,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7246/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,391,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7247/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,391,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7248/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=1,391,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7249/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,391,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7250/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,392,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7251/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,392,192,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7252/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,392,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7253/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,392,576,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7254/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=1,392,768,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7255/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,392,960,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7256/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,393,152,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7257/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,393,344,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7258/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,393,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7259/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,393,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7260/500000] + optim/total_grad_norm=1.559 + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=1,393,920,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7261/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,394,112,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7262/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=1,394,304,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7263/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=1,394,496,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7264/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,394,688,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7265/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,394,880,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7266/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,395,072,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7267/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,395,264,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7268/500000] + train/ActionNoiseL2Loss=0.1094 + throughput/total_tokens=1,395,456,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7269/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,395,648,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=7270/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,395,840,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7271/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,396,032,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7272/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,396,224,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7273/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,396,416,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7274/500000] + train/ActionNoiseL2Loss=0.1287 + throughput/total_tokens=1,396,608,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7275/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,396,800,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7276/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,396,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7277/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=1,397,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7278/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,397,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7279/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,397,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7280/500000] + optim/total_grad_norm=0.9627 + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,397,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7281/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=1,397,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7282/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=1,398,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7283/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,398,336,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7284/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,398,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7285/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,398,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7286/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,398,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7287/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=1,399,104,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7288/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=1,399,296,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7289/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,399,488,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7290/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=1,399,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7291/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,399,872,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7292/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=1,400,064,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7293/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,400,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7294/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=1,400,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7295/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,400,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7296/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,400,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7297/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,401,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7298/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,401,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7299/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,401,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7300/500000] + optim/total_grad_norm=1.067 + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=1,401,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7301/500000] + train/ActionNoiseL2Loss=0.1160 + throughput/total_tokens=1,401,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7302/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,401,984,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7303/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,402,176,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7304/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=1,402,368,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7305/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,402,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7306/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,402,752,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7307/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,402,944,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7308/500000] + train/ActionNoiseL2Loss=0.0303 + throughput/total_tokens=1,403,136,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7309/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=1,403,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7310/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,403,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=7311/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,403,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7312/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,403,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7313/500000] + train/ActionNoiseL2Loss=0.1732 + throughput/total_tokens=1,404,096,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7314/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,404,288,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7315/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=1,404,480,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7316/500000] + train/ActionNoiseL2Loss=0.0215 + throughput/total_tokens=1,404,672,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7317/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,404,864,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7318/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,405,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7319/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,405,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7320/500000] + optim/total_grad_norm=1.835 + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,405,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7321/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=1,405,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7322/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=1,405,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7323/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,406,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7324/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,406,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7325/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,406,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7326/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,406,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7327/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,406,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7328/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,406,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7329/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,407,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7330/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,407,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7331/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,407,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7332/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,407,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7333/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,407,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7334/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,408,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7335/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,408,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7336/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,408,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7337/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,408,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7338/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,408,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7339/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,409,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7340/500000] + optim/total_grad_norm=1.273 + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,409,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7341/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,409,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7342/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,409,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7343/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,409,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7344/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,410,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7345/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,410,240,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7346/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,410,432,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7347/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,410,624,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7348/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,410,816,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7349/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,411,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7350/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,411,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7351/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,411,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7352/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,411,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7353/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,411,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7354/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=1,411,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7355/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,412,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7356/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,412,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7357/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,412,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7358/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,412,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7359/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,412,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7360/500000] + optim/total_grad_norm=1.088 + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,413,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7361/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,413,312,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7362/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,413,504,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7363/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,413,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7364/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,413,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7365/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,414,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7366/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,414,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7367/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,414,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7368/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,414,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7369/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,414,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7370/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,415,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7371/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,415,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7372/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,415,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7373/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,415,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7374/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,415,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7375/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,416,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7376/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,416,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7377/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,416,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7378/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,416,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7379/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,416,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7380/500000] + optim/total_grad_norm=1.912 + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=1,416,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7381/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,417,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7382/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,417,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7383/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,417,536,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7384/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,417,728,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7385/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,417,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7386/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=1,418,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7387/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,418,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7388/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,418,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7389/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=1,418,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7390/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,418,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7391/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=1,419,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7392/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,419,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7393/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,419,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7394/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,419,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7395/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=1,419,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7396/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=1,420,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7397/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,420,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7398/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,420,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7399/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,420,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7400/500000] + optim/total_grad_norm=1.260 + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,420,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7401/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,420,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7402/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,421,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7403/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,421,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7404/500000] + train/ActionNoiseL2Loss=0.1286 + throughput/total_tokens=1,421,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7405/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=1,421,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7406/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,421,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7407/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,422,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7408/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=1,422,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7409/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,422,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7410/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,422,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7411/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,422,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7412/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,423,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7413/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,423,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7414/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=1,423,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7415/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,423,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7416/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,423,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7417/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=1,424,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7418/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,424,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7419/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,424,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7420/500000] + optim/total_grad_norm=1.315 + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,424,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7421/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=1,424,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7422/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,425,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7423/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,425,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7424/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=1,425,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7425/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=1,425,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7426/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,425,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7427/500000] + train/ActionNoiseL2Loss=0.0226 + throughput/total_tokens=1,425,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7428/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,426,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7429/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,426,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7430/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,426,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7431/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,426,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7432/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=1,426,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7433/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,427,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7434/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=1,427,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7435/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,427,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7436/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,427,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7437/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,427,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7438/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,428,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7439/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,428,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7440/500000] + optim/total_grad_norm=1.047 + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,428,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7441/500000] + train/ActionNoiseL2Loss=0.0288 + throughput/total_tokens=1,428,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7442/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,428,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7443/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,429,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7444/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,429,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7445/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,429,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7446/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,429,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7447/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,429,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7448/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=1,430,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7449/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,430,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7450/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,430,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7451/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,430,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7452/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,430,784,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7453/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,430,976,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7454/500000] + train/ActionNoiseL2Loss=0.0266 + throughput/total_tokens=1,431,168,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7455/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,431,360,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7456/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,431,552,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7457/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,431,744,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7458/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,431,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7459/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,432,128,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7460/500000] + optim/total_grad_norm=1.599 + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=1,432,320,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7461/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=1,432,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7462/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,432,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7463/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,432,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7464/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,433,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7465/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,433,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7466/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,433,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7467/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,433,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7468/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,433,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7469/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=1,434,048,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7470/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,434,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7471/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,434,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7472/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,434,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7473/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,434,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7474/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,435,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7475/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,435,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7476/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,435,392,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7477/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,435,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7478/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,435,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7479/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,435,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7480/500000] + optim/total_grad_norm=2.449 + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=1,436,160,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7481/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,436,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7482/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,436,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7483/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,436,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7484/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,436,928,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7485/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=1,437,120,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7486/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,437,312,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7487/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,437,504,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7488/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,437,696,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7489/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,437,888,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7490/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,438,080,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7491/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,438,272,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7492/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,438,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7493/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,438,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7494/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=1,438,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7495/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,439,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7496/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,439,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7497/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,439,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7498/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,439,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7499/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,439,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7500/500000] + optim/total_grad_norm=1.497 + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,440,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/07 [13:08:47] INFO | >> Saving config... checkpoint.py:608 +10/07 [13:09:36] INFO | >> Saving model state... checkpoint.py:796 +10/07 [13:10:49] INFO | >> Saving optim state... checkpoint.py:811 +10/07 [13:12:23] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=7501/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,440,192,000 + throughput/device/tokens_per_second=1,196 + throughput/device/batches_per_second=0.0498 +[step=7502/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,440,384,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7503/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,440,576,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0487 +[step=7504/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,440,768,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=7505/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,440,960,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=7506/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,441,152,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=7507/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,441,344,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=7508/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,441,536,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=7509/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=1,441,728,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=7510/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,441,920,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7511/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,442,112,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7512/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,442,304,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7513/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,442,496,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7514/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,442,688,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7515/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,442,880,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7516/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=1,443,072,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7517/500000] + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=1,443,264,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7518/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,443,456,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7519/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,443,648,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7520/500000] + optim/total_grad_norm=1.501 + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,443,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7521/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,444,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7522/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,444,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7523/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,444,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7524/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,444,608,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7525/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,444,800,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7526/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,444,992,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7527/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,445,184,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7528/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,445,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7529/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,445,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7530/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,445,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7531/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,445,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7532/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,446,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7533/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,446,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7534/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,446,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7535/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,446,720,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7536/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=1,446,912,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7537/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,447,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7538/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=1,447,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7539/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,447,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7540/500000] + optim/total_grad_norm=1.330 + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,447,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7541/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,447,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7542/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,448,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7543/500000] + train/ActionNoiseL2Loss=0.0258 + throughput/total_tokens=1,448,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7544/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,448,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7545/500000] + train/ActionNoiseL2Loss=0.0257 + throughput/total_tokens=1,448,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7546/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,448,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7547/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,449,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7548/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,449,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7549/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,449,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7550/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,449,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7551/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,449,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7552/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,449,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7553/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,450,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7554/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,450,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7555/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,450,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7556/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,450,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7557/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,450,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7558/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,451,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7559/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,451,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7560/500000] + optim/total_grad_norm=0.8735 + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,451,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7561/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=1,451,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7562/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,451,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7563/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,452,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7564/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,452,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7565/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,452,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7566/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,452,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7567/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,452,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7568/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,453,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7569/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,453,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7570/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,453,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7571/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,453,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7572/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=1,453,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7573/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,454,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7574/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=1,454,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7575/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,454,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7576/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,454,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7577/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,454,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7578/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=1,454,976,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7579/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,455,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7580/500000] + optim/total_grad_norm=1.567 + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,455,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7581/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,455,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7582/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,455,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7583/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,455,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7584/500000] + train/ActionNoiseL2Loss=0.0201 + throughput/total_tokens=1,456,128,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7585/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,456,320,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7586/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,456,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7587/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,456,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7588/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,456,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7589/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,457,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7590/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,457,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7591/500000] + train/ActionNoiseL2Loss=0.0265 + throughput/total_tokens=1,457,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7592/500000] + train/ActionNoiseL2Loss=0.1143 + throughput/total_tokens=1,457,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7593/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,457,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7594/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,458,048,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7595/500000] + train/ActionNoiseL2Loss=0.0219 + throughput/total_tokens=1,458,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7596/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,458,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7597/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,458,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7598/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,458,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7599/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=1,459,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7600/500000] + optim/total_grad_norm=1.383 + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,459,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7601/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,459,392,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7602/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,459,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7603/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,459,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7604/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,459,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7605/500000] + train/ActionNoiseL2Loss=0.0189 + throughput/total_tokens=1,460,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7606/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,460,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7607/500000] + train/ActionNoiseL2Loss=0.1411 + throughput/total_tokens=1,460,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7608/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,460,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7609/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,460,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7610/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,461,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=7611/500000] + train/ActionNoiseL2Loss=0.1197 + throughput/total_tokens=1,461,312,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7612/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=1,461,504,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7613/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,461,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7614/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,461,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7615/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,462,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7616/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,462,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7617/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,462,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7618/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,462,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7619/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,462,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=7620/500000] + optim/total_grad_norm=1.574 + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,463,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7621/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,463,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7622/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,463,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7623/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,463,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7624/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,463,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7625/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,464,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7626/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,464,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7627/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,464,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7628/500000] + train/ActionNoiseL2Loss=0.1339 + throughput/total_tokens=1,464,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7629/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,464,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7630/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,464,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7631/500000] + train/ActionNoiseL2Loss=0.0212 + throughput/total_tokens=1,465,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7632/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=1,465,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7633/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,465,536,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7634/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,465,728,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7635/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,465,920,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7636/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,466,112,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7637/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,466,304,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7638/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,466,496,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7639/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=1,466,688,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7640/500000] + optim/total_grad_norm=2.016 + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=1,466,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7641/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=1,467,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7642/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,467,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7643/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,467,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7644/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,467,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7645/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,467,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7646/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,468,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7647/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,468,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7648/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,468,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7649/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=1,468,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7650/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,468,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7651/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=1,468,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7652/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,469,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7653/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,469,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7654/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,469,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7655/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,469,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7656/500000] + train/ActionNoiseL2Loss=0.1002 + throughput/total_tokens=1,469,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7657/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,470,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7658/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,470,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7659/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,470,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7660/500000] + optim/total_grad_norm=1.156 + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,470,720,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7661/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,470,912,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7662/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,471,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7663/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,471,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7664/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,471,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7665/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,471,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7666/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,471,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7667/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,472,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7668/500000] + train/ActionNoiseL2Loss=0.1013 + throughput/total_tokens=1,472,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7669/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,472,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7670/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,472,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7671/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,472,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7672/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,473,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7673/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,473,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7674/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,473,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7675/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,473,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7676/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,473,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7677/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,473,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7678/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=1,474,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7679/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,474,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7680/500000] + optim/total_grad_norm=1.283 + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,474,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7681/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,474,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7682/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,474,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7683/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,475,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7684/500000] + train/ActionNoiseL2Loss=0.1150 + throughput/total_tokens=1,475,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7685/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=1,475,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7686/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=1,475,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7687/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,475,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7688/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,476,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7689/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,476,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7690/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=1,476,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7691/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,476,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7692/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,476,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7693/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,477,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7694/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=1,477,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7695/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,477,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7696/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,477,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7697/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=1,477,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7698/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,478,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7699/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=1,478,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7700/500000] + optim/total_grad_norm=1.193 + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,478,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7701/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=1,478,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7702/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,478,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7703/500000] + train/ActionNoiseL2Loss=0.0219 + throughput/total_tokens=1,478,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7704/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,479,168,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7705/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=1,479,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7706/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,479,552,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7707/500000] + train/ActionNoiseL2Loss=0.0293 + throughput/total_tokens=1,479,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7708/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,479,936,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7709/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,480,128,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7710/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,480,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7711/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=1,480,512,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7712/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=1,480,704,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7713/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,480,896,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7714/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,481,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7715/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,481,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7716/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,481,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7717/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,481,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7718/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,481,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7719/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=1,482,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7720/500000] + optim/total_grad_norm=1.482 + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,482,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7721/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,482,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7722/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,482,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7723/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,482,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7724/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,483,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7725/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=1,483,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7726/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,483,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7727/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,483,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7728/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,483,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7729/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,483,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7730/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,484,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7731/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,484,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7732/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,484,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7733/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,484,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7734/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,484,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7735/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,485,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7736/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,485,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7737/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=1,485,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7738/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,485,696,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7739/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,485,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7740/500000] + optim/total_grad_norm=1.352 + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=1,486,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7741/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,486,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7742/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,486,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7743/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,486,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7744/500000] + train/ActionNoiseL2Loss=0.1725 + throughput/total_tokens=1,486,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7745/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,487,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7746/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,487,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7747/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=1,487,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7748/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,487,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7749/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,487,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7750/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=1,488,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7751/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,488,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7752/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,488,384,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7753/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,488,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7754/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,488,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7755/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,488,960,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7756/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=1,489,152,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7757/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=1,489,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7758/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,489,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7759/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,489,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7760/500000] + optim/total_grad_norm=1.133 + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,489,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7761/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,490,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7762/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,490,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7763/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,490,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7764/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,490,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7765/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,490,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7766/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,491,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7767/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,491,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7768/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=1,491,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7769/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,491,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7770/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,491,840,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7771/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,492,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7772/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,492,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7773/500000] + train/ActionNoiseL2Loss=0.0181 + throughput/total_tokens=1,492,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7774/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,492,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7775/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,492,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7776/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,492,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7777/500000] + train/ActionNoiseL2Loss=0.1122 + throughput/total_tokens=1,493,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7778/500000] + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=1,493,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7779/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,493,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7780/500000] + optim/total_grad_norm=1.002 + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,493,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7781/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,493,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7782/500000] + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=1,494,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7783/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=1,494,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7784/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,494,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7785/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,494,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7786/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,494,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7787/500000] + train/ActionNoiseL2Loss=0.1579 + throughput/total_tokens=1,495,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7788/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,495,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7789/500000] + train/ActionNoiseL2Loss=0.1484 + throughput/total_tokens=1,495,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7790/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,495,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7791/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,495,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7792/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,496,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7793/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,496,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7794/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=1,496,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7795/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=1,496,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7796/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,496,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7797/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,497,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7798/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,497,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7799/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,497,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7800/500000] + optim/total_grad_norm=1.330 + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,497,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7801/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,497,792,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7802/500000] + train/ActionNoiseL2Loss=0.1212 + throughput/total_tokens=1,497,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7803/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,498,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7804/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,498,368,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7805/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=1,498,560,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7806/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=1,498,752,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7807/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,498,944,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7808/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,499,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7809/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=1,499,328,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7810/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,499,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7811/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,499,712,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7812/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,499,904,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7813/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=1,500,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7814/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,500,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7815/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,500,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7816/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,500,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7817/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,500,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7818/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,501,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7819/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,501,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7820/500000] + optim/total_grad_norm=1.293 + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,501,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7821/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=1,501,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7822/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=1,501,824,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7823/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,502,016,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7824/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,502,208,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7825/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,502,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7826/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,502,592,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7827/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,502,784,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7828/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,502,976,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7829/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,503,168,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7830/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=1,503,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7831/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,503,552,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7832/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,503,744,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7833/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,503,936,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7834/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=1,504,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7835/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,504,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7836/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=1,504,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7837/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,504,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7838/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,504,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7839/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,505,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7840/500000] + optim/total_grad_norm=1.210 + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,505,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7841/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,505,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7842/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,505,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7843/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=1,505,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7844/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,506,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7845/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,506,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7846/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,506,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7847/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,506,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7848/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,506,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7849/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,507,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7850/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,507,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7851/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,507,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7852/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,507,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7853/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=1,507,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7854/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=1,507,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7855/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,508,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7856/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,508,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7857/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,508,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7858/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,508,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7859/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,508,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7860/500000] + optim/total_grad_norm=1.606 + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,509,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7861/500000] + train/ActionNoiseL2Loss=0.0293 + throughput/total_tokens=1,509,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7862/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,509,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7863/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,509,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7864/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,509,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7865/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,510,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7866/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=1,510,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7867/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,510,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7868/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,510,656,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7869/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=1,510,848,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7870/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,511,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7871/500000] + train/ActionNoiseL2Loss=0.0160 + throughput/total_tokens=1,511,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7872/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,511,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7873/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,511,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7874/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,511,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7875/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,512,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7876/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,512,192,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7877/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,512,384,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7878/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,512,576,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7879/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,512,768,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7880/500000] + optim/total_grad_norm=0.9641 + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=1,512,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7881/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,513,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7882/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,513,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7883/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=1,513,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7884/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,513,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7885/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=1,513,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7886/500000] + train/ActionNoiseL2Loss=0.1357 + throughput/total_tokens=1,514,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7887/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,514,304,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7888/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=1,514,496,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7889/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=1,514,688,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7890/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,514,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7891/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,515,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7892/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,515,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7893/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,515,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7894/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,515,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7895/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,515,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7896/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=1,516,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7897/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,516,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7898/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,516,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7899/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,516,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7900/500000] + optim/total_grad_norm=1.632 + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,516,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7901/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=1,516,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7902/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,517,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7903/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=1,517,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7904/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,517,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7905/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=1,517,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7906/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,517,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7907/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,518,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7908/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=1,518,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7909/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,518,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7910/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,518,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7911/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,518,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7912/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,519,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7913/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,519,296,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7914/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,519,488,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7915/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,519,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7916/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,519,872,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7917/500000] + train/ActionNoiseL2Loss=0.1101 + throughput/total_tokens=1,520,064,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7918/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,520,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7919/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=1,520,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=7920/500000] + optim/total_grad_norm=1.271 + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,520,640,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7921/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,520,832,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7922/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=1,521,024,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7923/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=1,521,216,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7924/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,521,408,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7925/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=1,521,600,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7926/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=1,521,792,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7927/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=1,521,984,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7928/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,522,176,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7929/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=1,522,368,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7930/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=1,522,560,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7931/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,522,752,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7932/500000] + train/ActionNoiseL2Loss=0.0250 + throughput/total_tokens=1,522,944,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7933/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,523,136,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7934/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,523,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7935/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,523,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7936/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=1,523,712,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7937/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,523,904,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7938/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,524,096,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7939/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,524,288,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7940/500000] + optim/total_grad_norm=1.305 + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,524,480,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7941/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,524,672,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7942/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,524,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7943/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,525,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7944/500000] + train/ActionNoiseL2Loss=0.0237 + throughput/total_tokens=1,525,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7945/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,525,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7946/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=1,525,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7947/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=1,525,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7948/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,526,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7949/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=1,526,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7950/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,526,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7951/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,526,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7952/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,526,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7953/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,526,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7954/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,527,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7955/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=1,527,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=7956/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,527,552,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7957/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,527,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7958/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,527,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7959/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,528,128,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7960/500000] + optim/total_grad_norm=0.9730 + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,528,320,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=7961/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,528,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7962/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,528,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7963/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,528,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=7964/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=1,529,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7965/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,529,280,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7966/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=1,529,472,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7967/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=1,529,664,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7968/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,529,856,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7969/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,530,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=7970/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=1,530,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=7971/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,530,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7972/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,530,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7973/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,530,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7974/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,531,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7975/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,531,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=7976/500000] + train/ActionNoiseL2Loss=0.0216 + throughput/total_tokens=1,531,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=7977/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,531,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7978/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,531,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7979/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,531,968,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7980/500000] + optim/total_grad_norm=1.184 + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,532,160,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7981/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,532,352,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7982/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,532,544,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7983/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,532,736,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=7984/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,532,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7985/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,533,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7986/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,533,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7987/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,533,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7988/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,533,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7989/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,533,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7990/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,534,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=7991/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,534,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7992/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,534,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7993/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,534,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7994/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,534,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7995/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,535,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7996/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,535,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7997/500000] + train/ActionNoiseL2Loss=0.0165 + throughput/total_tokens=1,535,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7998/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,535,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=7999/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,535,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8000/500000] + optim/total_grad_norm=1.130 + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,536,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +10/07 [16:06:51] INFO | >> Saving config... checkpoint.py:608 +10/07 [16:07:24] INFO | >> Saving model state... checkpoint.py:796 +10/07 [16:08:38] INFO | >> Saving optim state... checkpoint.py:811 +10/07 [16:10:12] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=8001/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,536,192,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0494 +[step=8002/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,536,384,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8003/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,536,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8004/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,536,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8005/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,536,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8006/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=1,537,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8007/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,537,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8008/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,537,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8009/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,537,728,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8010/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=1,537,920,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8011/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,538,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8012/500000] + train/ActionNoiseL2Loss=0.0198 + throughput/total_tokens=1,538,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8013/500000] + train/ActionNoiseL2Loss=0.0278 + throughput/total_tokens=1,538,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8014/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,538,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8015/500000] + train/ActionNoiseL2Loss=0.1368 + throughput/total_tokens=1,538,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8016/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,539,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8017/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,539,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8018/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,539,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8019/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,539,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8020/500000] + optim/total_grad_norm=2.193 + train/ActionNoiseL2Loss=0.1167 + throughput/total_tokens=1,539,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8021/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,540,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8022/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,540,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8023/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,540,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8024/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,540,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8025/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,540,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8026/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,540,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8027/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=1,541,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8028/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,541,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8029/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,541,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8030/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,541,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8031/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,541,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8032/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,542,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8033/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,542,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8034/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,542,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8035/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,542,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8036/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,542,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8037/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=1,543,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8038/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,543,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8039/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,543,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8040/500000] + optim/total_grad_norm=1.177 + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,543,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8041/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,543,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8042/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,544,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8043/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,544,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8044/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,544,448,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8045/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,544,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8046/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=1,544,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8047/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,545,024,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8048/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,545,216,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8049/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=1,545,408,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8050/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,545,600,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8051/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,545,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8052/500000] + train/ActionNoiseL2Loss=0.0279 + throughput/total_tokens=1,545,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8053/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,546,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8054/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,546,368,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8055/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,546,560,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8056/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,546,752,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8057/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,546,944,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8058/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,547,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8059/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,547,328,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8060/500000] + optim/total_grad_norm=1.385 + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,547,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8061/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,547,712,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8062/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,547,904,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8063/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,548,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8064/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,548,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8065/500000] + train/ActionNoiseL2Loss=0.0286 + throughput/total_tokens=1,548,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8066/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,548,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8067/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=1,548,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8068/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,549,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8069/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,549,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8070/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,549,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8071/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,549,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8072/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,549,824,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8073/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,550,016,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8074/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=1,550,208,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8075/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,550,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8076/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,550,592,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8077/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,550,784,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8078/500000] + train/ActionNoiseL2Loss=0.1428 + throughput/total_tokens=1,550,976,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8079/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,551,168,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8080/500000] + optim/total_grad_norm=1.480 + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,551,360,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8081/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,551,552,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8082/500000] + train/ActionNoiseL2Loss=0.1466 + throughput/total_tokens=1,551,744,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8083/500000] + train/ActionNoiseL2Loss=0.0254 + throughput/total_tokens=1,551,936,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8084/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,552,128,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8085/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,552,320,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8086/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,552,512,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8087/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,552,704,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8088/500000] + train/ActionNoiseL2Loss=0.0269 + throughput/total_tokens=1,552,896,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8089/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,553,088,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8090/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,553,280,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8091/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,553,472,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8092/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,553,664,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8093/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,553,856,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8094/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,554,048,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8095/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,554,240,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8096/500000] + train/ActionNoiseL2Loss=0.0237 + throughput/total_tokens=1,554,432,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8097/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=1,554,624,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8098/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,554,816,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8099/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,555,008,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8100/500000] + optim/total_grad_norm=1.443 + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,555,200,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8101/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,555,392,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8102/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,555,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8103/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,555,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8104/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,555,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8105/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,556,160,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8106/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,556,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8107/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,556,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8108/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,556,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8109/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,556,928,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8110/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,557,120,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8111/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,557,312,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8112/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,557,504,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8113/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,557,696,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8114/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=1,557,888,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8115/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=1,558,080,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8116/500000] + train/ActionNoiseL2Loss=0.1185 + throughput/total_tokens=1,558,272,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8117/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,558,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8118/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,558,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8119/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,558,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8120/500000] + optim/total_grad_norm=1.167 + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,559,040,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8121/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,559,232,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8122/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,559,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8123/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,559,616,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8124/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,559,808,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8125/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,560,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8126/500000] + train/ActionNoiseL2Loss=0.0194 + throughput/total_tokens=1,560,192,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8127/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,560,384,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8128/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,560,576,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8129/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,560,768,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8130/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,560,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8131/500000] + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=1,561,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8132/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,561,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8133/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,561,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8134/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,561,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8135/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=1,561,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8136/500000] + train/ActionNoiseL2Loss=0.0203 + throughput/total_tokens=1,562,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8137/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,562,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8138/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,562,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8139/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,562,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8140/500000] + optim/total_grad_norm=1.121 + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,562,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8141/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,563,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8142/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,563,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8143/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,563,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8144/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,563,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8145/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=1,563,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8146/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=1,564,032,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8147/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,564,224,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8148/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=1,564,416,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8149/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,564,608,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8150/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,564,800,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8151/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,564,992,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8152/500000] + train/ActionNoiseL2Loss=0.1084 + throughput/total_tokens=1,565,184,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8153/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,565,376,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8154/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=1,565,568,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8155/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,565,760,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8156/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,565,952,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8157/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=1,566,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8158/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,566,336,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8159/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,566,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8160/500000] + optim/total_grad_norm=1.248 + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,566,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8161/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,566,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8162/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,567,104,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8163/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,567,296,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8164/500000] + train/ActionNoiseL2Loss=0.0299 + throughput/total_tokens=1,567,488,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8165/500000] + train/ActionNoiseL2Loss=0.1071 + throughput/total_tokens=1,567,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8166/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,567,872,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8167/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,568,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8168/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=1,568,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8169/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,568,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8170/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,568,640,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8171/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,568,832,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8172/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=1,569,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8173/500000] + train/ActionNoiseL2Loss=0.0982 + throughput/total_tokens=1,569,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8174/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,569,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8175/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=1,569,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8176/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,569,792,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8177/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,569,984,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8178/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,570,176,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8179/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=1,570,368,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8180/500000] + optim/total_grad_norm=1.262 + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,570,560,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8181/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,570,752,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8182/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,570,944,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8183/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,571,136,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8184/500000] + train/ActionNoiseL2Loss=0.1200 + throughput/total_tokens=1,571,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8185/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,571,520,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8186/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,571,712,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8187/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,571,904,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8188/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,572,096,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8189/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=1,572,288,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8190/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=1,572,480,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8191/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,572,672,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8192/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,572,864,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8193/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,573,056,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8194/500000] + train/ActionNoiseL2Loss=0.0929 + throughput/total_tokens=1,573,248,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8195/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,573,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8196/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=1,573,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8197/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=1,573,824,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8198/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,574,016,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8199/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,574,208,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8200/500000] + optim/total_grad_norm=2.440 + train/ActionNoiseL2Loss=0.1138 + throughput/total_tokens=1,574,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8201/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,574,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8202/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,574,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8203/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,574,976,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8204/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,575,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8205/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,575,360,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8206/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,575,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8207/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,575,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8208/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,575,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8209/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,576,128,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8210/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,576,320,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8211/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,576,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8212/500000] + train/ActionNoiseL2Loss=0.0306 + throughput/total_tokens=1,576,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8213/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,576,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8214/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,577,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8215/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,577,280,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8216/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,577,472,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8217/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=1,577,664,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8218/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,577,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8219/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,578,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8220/500000] + optim/total_grad_norm=1.423 + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,578,240,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8221/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,578,432,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8222/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,578,624,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8223/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,578,816,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8224/500000] + train/ActionNoiseL2Loss=0.1154 + throughput/total_tokens=1,579,008,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8225/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,579,200,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8226/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,579,392,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8227/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,579,584,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8228/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,579,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8229/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,579,968,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8230/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,580,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8231/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,580,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8232/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,580,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8233/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,580,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8234/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,580,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8235/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,581,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8236/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,581,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8237/500000] + train/ActionNoiseL2Loss=0.1079 + throughput/total_tokens=1,581,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8238/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,581,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8239/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,581,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8240/500000] + optim/total_grad_norm=1.305 + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,582,080,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8241/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,582,272,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8242/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,582,464,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8243/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,582,656,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8244/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,582,848,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8245/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,583,040,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8246/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,583,232,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8247/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,583,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8248/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,583,616,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8249/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,583,808,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8250/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=1,584,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8251/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,584,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8252/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=1,584,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8253/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,584,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8254/500000] + train/ActionNoiseL2Loss=0.0277 + throughput/total_tokens=1,584,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8255/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,584,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8256/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,585,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8257/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,585,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8258/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,585,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8259/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,585,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8260/500000] + optim/total_grad_norm=1.121 + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,585,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8261/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,586,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8262/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,586,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8263/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,586,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8264/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,586,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8265/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,586,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8266/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,587,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8267/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,587,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8268/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,587,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8269/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,587,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8270/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=1,587,840,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8271/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,588,032,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8272/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,588,224,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8273/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=1,588,416,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8274/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,588,608,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8275/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,588,800,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8276/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,588,992,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8277/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,589,184,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8278/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,589,376,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8279/500000] + train/ActionNoiseL2Loss=0.1096 + throughput/total_tokens=1,589,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8280/500000] + optim/total_grad_norm=0.8844 + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,589,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8281/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=1,589,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8282/500000] + train/ActionNoiseL2Loss=0.1257 + throughput/total_tokens=1,590,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8283/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,590,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8284/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,590,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8285/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,590,720,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8286/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=1,590,912,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8287/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,591,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8288/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=1,591,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8289/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,591,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8290/500000] + train/ActionNoiseL2Loss=0.1267 + throughput/total_tokens=1,591,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8291/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,591,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8292/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,592,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8293/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,592,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8294/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,592,448,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8295/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,592,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8296/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,592,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8297/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,593,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8298/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,593,216,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8299/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,593,408,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8300/500000] + optim/total_grad_norm=1.226 + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,593,600,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8301/500000] + train/ActionNoiseL2Loss=0.0211 + throughput/total_tokens=1,593,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8302/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,593,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8303/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,594,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8304/500000] + train/ActionNoiseL2Loss=0.0247 + throughput/total_tokens=1,594,368,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8305/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,594,560,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8306/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,594,752,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8307/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,594,944,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8308/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=1,595,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8309/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,595,328,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8310/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,595,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8311/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,595,712,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8312/500000] + train/ActionNoiseL2Loss=0.0237 + throughput/total_tokens=1,595,904,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8313/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=1,596,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8314/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,596,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8315/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,596,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8316/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,596,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8317/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,596,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8318/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,597,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8319/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,597,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8320/500000] + optim/total_grad_norm=1.664 + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,597,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8321/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,597,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8322/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,597,824,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8323/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,598,016,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8324/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,598,208,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8325/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,598,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8326/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,598,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8327/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,598,784,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8328/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,598,976,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8329/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,599,168,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8330/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,599,360,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8331/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,599,552,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8332/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,599,744,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8333/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,599,936,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8334/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,600,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8335/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,600,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8336/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=1,600,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8337/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,600,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8338/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=1,600,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8339/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,601,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8340/500000] + optim/total_grad_norm=1.161 + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,601,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8341/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,601,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8342/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,601,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8343/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=1,601,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8344/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,602,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8345/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=1,602,240,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8346/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=1,602,432,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8347/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,602,624,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8348/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,602,816,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8349/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,603,008,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8350/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,603,200,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8351/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,603,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8352/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,603,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8353/500000] + train/ActionNoiseL2Loss=0.1221 + throughput/total_tokens=1,603,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8354/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,603,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8355/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,604,160,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8356/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=1,604,352,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8357/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,604,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8358/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=1,604,736,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8359/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,604,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8360/500000] + optim/total_grad_norm=2.594 + train/ActionNoiseL2Loss=0.1262 + throughput/total_tokens=1,605,120,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=8361/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,605,312,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8362/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,605,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8363/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,605,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8364/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,605,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8365/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,606,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8366/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,606,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8367/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=1,606,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8368/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,606,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=8369/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,606,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=8370/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=1,607,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8371/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,607,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8372/500000] + train/ActionNoiseL2Loss=0.1087 + throughput/total_tokens=1,607,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8373/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,607,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8374/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=1,607,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8375/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,608,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8376/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,608,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8377/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,608,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8378/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,608,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8379/500000] + train/ActionNoiseL2Loss=0.1388 + throughput/total_tokens=1,608,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8380/500000] + optim/total_grad_norm=1.191 + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,608,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8381/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,609,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8382/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,609,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8383/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,609,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8384/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,609,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8385/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,609,920,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8386/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=1,610,112,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8387/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,610,304,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8388/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=1,610,496,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8389/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,610,688,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8390/500000] + train/ActionNoiseL2Loss=0.1196 + throughput/total_tokens=1,610,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8391/500000] + train/ActionNoiseL2Loss=0.0299 + throughput/total_tokens=1,611,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8392/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,611,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8393/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,611,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8394/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,611,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8395/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,611,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8396/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,612,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8397/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,612,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8398/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=1,612,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8399/500000] + train/ActionNoiseL2Loss=0.0199 + throughput/total_tokens=1,612,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8400/500000] + optim/total_grad_norm=1.399 + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=1,612,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8401/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,612,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8402/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,613,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8403/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,613,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8404/500000] + train/ActionNoiseL2Loss=0.0223 + throughput/total_tokens=1,613,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8405/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,613,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8406/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,613,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8407/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,614,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8408/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,614,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8409/500000] + train/ActionNoiseL2Loss=0.1652 + throughput/total_tokens=1,614,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8410/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,614,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=8411/500000] + train/ActionNoiseL2Loss=0.1079 + throughput/total_tokens=1,614,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8412/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,615,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8413/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,615,296,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8414/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,615,488,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8415/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,615,680,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8416/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,615,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8417/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,616,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8418/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,616,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8419/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,616,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8420/500000] + optim/total_grad_norm=1.106 + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,616,640,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8421/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,616,832,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8422/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,617,024,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8423/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=1,617,216,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8424/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,617,408,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8425/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=1,617,600,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8426/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,617,792,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8427/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,617,984,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8428/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,618,176,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8429/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,618,368,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8430/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,618,560,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8431/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,618,752,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8432/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,618,944,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8433/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,619,136,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8434/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,619,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8435/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,619,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8436/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,619,712,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8437/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,619,904,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8438/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=1,620,096,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8439/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,620,288,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8440/500000] + optim/total_grad_norm=0.8882 + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,620,480,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8441/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,620,672,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8442/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,620,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8443/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,621,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8444/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,621,248,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8445/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,621,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8446/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,621,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8447/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,621,824,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8448/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,622,016,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8449/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,622,208,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8450/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,622,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8451/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,622,592,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8452/500000] + train/ActionNoiseL2Loss=0.0233 + throughput/total_tokens=1,622,784,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8453/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=1,622,976,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8454/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,623,168,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8455/500000] + train/ActionNoiseL2Loss=0.0155 + throughput/total_tokens=1,623,360,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8456/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,623,552,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8457/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,623,744,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8458/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,623,936,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8459/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,624,128,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8460/500000] + optim/total_grad_norm=1.117 + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,624,320,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 + System/Peak GPU Memory (MB)=46,467 +[step=8461/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,624,512,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8462/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,624,704,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8463/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,624,896,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8464/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,625,088,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8465/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,625,280,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8466/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=1,625,472,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8467/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,625,664,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8468/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,625,856,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8469/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=1,626,048,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=8470/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,626,240,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8471/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,626,432,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8472/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,626,624,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8473/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=1,626,816,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8474/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,627,008,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8475/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,627,200,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8476/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,627,392,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8477/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=1,627,584,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8478/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,627,776,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8479/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,627,968,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8480/500000] + optim/total_grad_norm=1.460 + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=1,628,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8481/500000] + train/ActionNoiseL2Loss=0.0298 + throughput/total_tokens=1,628,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8482/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,628,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8483/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,628,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8484/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,628,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8485/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,629,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8486/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,629,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8487/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,629,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8488/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,629,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8489/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,629,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8490/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,630,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8491/500000] + train/ActionNoiseL2Loss=0.1456 + throughput/total_tokens=1,630,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8492/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,630,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8493/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=1,630,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8494/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,630,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8495/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,631,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8496/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,631,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8497/500000] + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=1,631,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8498/500000] + train/ActionNoiseL2Loss=0.0261 + throughput/total_tokens=1,631,616,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8499/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=1,631,808,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8500/500000] + optim/total_grad_norm=1.207 + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,632,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +10/07 [19:04:29] INFO | >> Saving config... checkpoint.py:608 +10/07 [19:05:13] INFO | >> Saving model state... checkpoint.py:796 +10/07 [19:06:26] INFO | >> Saving optim state... checkpoint.py:811 +10/07 [19:07:52] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=8501/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,632,192,000 + throughput/device/tokens_per_second=1,195 + throughput/device/batches_per_second=0.0498 +[step=8502/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=1,632,384,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8503/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,632,576,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=8504/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,632,768,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=8505/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,632,960,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8506/500000] + train/ActionNoiseL2Loss=0.0271 + throughput/total_tokens=1,633,152,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8507/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,633,344,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8508/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,633,536,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8509/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,633,728,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8510/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,633,920,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8511/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,634,112,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8512/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,634,304,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8513/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,634,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8514/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,634,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8515/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,634,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8516/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=1,635,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8517/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,635,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8518/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,635,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8519/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=1,635,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8520/500000] + optim/total_grad_norm=1.178 + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,635,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8521/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,636,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8522/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,636,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8523/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,636,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8524/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,636,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8525/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,636,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8526/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,636,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8527/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,637,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8528/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,637,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8529/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,637,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8530/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,637,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8531/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,637,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8532/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,638,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8533/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,638,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8534/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,638,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8535/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,638,720,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8536/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,638,912,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8537/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=1,639,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8538/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=1,639,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8539/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,639,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8540/500000] + optim/total_grad_norm=1.147 + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,639,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8541/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,639,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8542/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=1,640,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8543/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=1,640,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8544/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,640,448,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8545/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,640,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8546/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,640,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8547/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,641,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8548/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,641,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8549/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,641,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8550/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,641,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8551/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,641,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8552/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,641,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8553/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,642,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8554/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=1,642,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8555/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,642,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8556/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,642,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8557/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,642,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8558/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,643,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8559/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,643,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8560/500000] + optim/total_grad_norm=1.524 + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,643,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=8561/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,643,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8562/500000] + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=1,643,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8563/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,644,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8564/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,644,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8565/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,644,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8566/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,644,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8567/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,644,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8568/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,645,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8569/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,645,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8570/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=1,645,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8571/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,645,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8572/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,645,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8573/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,646,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8574/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,646,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8575/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,646,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8576/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=1,646,592,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8577/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,646,784,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8578/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,646,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8579/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,647,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8580/500000] + optim/total_grad_norm=1.334 + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,647,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8581/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,647,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8582/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,647,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8583/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,647,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8584/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,648,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8585/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,648,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8586/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=1,648,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8587/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,648,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8588/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,648,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8589/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,649,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8590/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,649,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8591/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,649,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8592/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,649,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8593/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,649,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8594/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,650,048,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8595/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,650,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8596/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,650,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8597/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,650,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8598/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,650,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8599/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,651,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8600/500000] + optim/total_grad_norm=1.513 + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,651,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8601/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,651,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=8602/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,651,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=8603/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,651,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=8604/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,651,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=8605/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,652,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=8606/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,652,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=8607/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=1,652,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=8608/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=1,652,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=8609/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,652,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=8610/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,653,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=8611/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,653,312,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=8612/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,653,504,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=8613/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,653,696,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=8614/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,653,888,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=8615/500000] + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=1,654,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=8616/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,654,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=8617/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,654,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=8618/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,654,656,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=8619/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,654,848,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=8620/500000] + optim/total_grad_norm=1.309 + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,655,040,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=8621/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,655,232,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8622/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,655,424,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8623/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,655,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8624/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,655,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8625/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,656,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8626/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,656,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8627/500000] + train/ActionNoiseL2Loss=0.0213 + throughput/total_tokens=1,656,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8628/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,656,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8629/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,656,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8630/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,656,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8631/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,657,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8632/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,657,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8633/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,657,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8634/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,657,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8635/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=1,657,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8636/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,658,112,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8637/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,658,304,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8638/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,658,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8639/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,658,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8640/500000] + optim/total_grad_norm=1.151 + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,658,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8641/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,659,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8642/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,659,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8643/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,659,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8644/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,659,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8645/500000] + train/ActionNoiseL2Loss=0.1122 + throughput/total_tokens=1,659,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8646/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,660,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8647/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,660,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8648/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,660,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8649/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,660,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8650/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,660,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8651/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,660,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8652/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,661,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8653/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,661,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8654/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,661,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8655/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,661,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8656/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,661,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8657/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=1,662,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8658/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,662,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8659/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,662,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8660/500000] + optim/total_grad_norm=1.076 + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=1,662,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=8661/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,662,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8662/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,663,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8663/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,663,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8664/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,663,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8665/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,663,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8666/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,663,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8667/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,664,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8668/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,664,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8669/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=1,664,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8670/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,664,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8671/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,664,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8672/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,665,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8673/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,665,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8674/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,665,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8675/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,665,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8676/500000] + train/ActionNoiseL2Loss=0.0209 + throughput/total_tokens=1,665,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8677/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=1,665,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8678/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,666,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8679/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,666,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8680/500000] + optim/total_grad_norm=1.437 + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,666,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8681/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=1,666,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8682/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,666,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8683/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,667,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8684/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,667,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8685/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,667,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8686/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,667,712,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8687/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,667,904,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8688/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,668,096,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8689/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,668,288,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8690/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,668,480,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8691/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,668,672,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8692/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,668,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8693/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,669,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8694/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,669,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8695/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,669,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8696/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,669,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8697/500000] + train/ActionNoiseL2Loss=0.0299 + throughput/total_tokens=1,669,824,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8698/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,670,016,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8699/500000] + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=1,670,208,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8700/500000] + optim/total_grad_norm=1.484 + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=1,670,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8701/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,670,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8702/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,670,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8703/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=1,670,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8704/500000] + train/ActionNoiseL2Loss=0.0286 + throughput/total_tokens=1,671,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8705/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,671,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8706/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,671,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8707/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,671,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8708/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,671,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8709/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,672,128,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8710/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,672,320,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8711/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,672,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8712/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,672,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8713/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,672,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8714/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,673,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8715/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,673,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8716/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,673,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8717/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,673,664,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8718/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,673,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8719/500000] + train/ActionNoiseL2Loss=0.1037 + throughput/total_tokens=1,674,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8720/500000] + optim/total_grad_norm=1.048 + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,674,240,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8721/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=1,674,432,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8722/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=1,674,624,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8723/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,674,816,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8724/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,675,008,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8725/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,675,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8726/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,675,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8727/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,675,584,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8728/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,675,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8729/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=1,675,968,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8730/500000] + train/ActionNoiseL2Loss=0.1123 + throughput/total_tokens=1,676,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8731/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,676,352,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8732/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,676,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8733/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,676,736,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8734/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,676,928,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8735/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=1,677,120,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8736/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,677,312,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8737/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,677,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8738/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,677,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8739/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,677,888,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8740/500000] + optim/total_grad_norm=1.461 + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,678,080,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8741/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,678,272,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8742/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,678,464,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8743/500000] + train/ActionNoiseL2Loss=0.0195 + throughput/total_tokens=1,678,656,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8744/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,678,848,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8745/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,679,040,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8746/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=1,679,232,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8747/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,679,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8748/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,679,616,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8749/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,679,808,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8750/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,680,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8751/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,680,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8752/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,680,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8753/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=1,680,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8754/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,680,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8755/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,680,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8756/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,681,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8757/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,681,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8758/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,681,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8759/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,681,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8760/500000] + optim/total_grad_norm=1.135 + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,681,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8761/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,682,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8762/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=1,682,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8763/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,682,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8764/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,682,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8765/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,682,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8766/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,683,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8767/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,683,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8768/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,683,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8769/500000] + train/ActionNoiseL2Loss=0.0220 + throughput/total_tokens=1,683,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8770/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,683,840,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8771/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,684,032,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8772/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=1,684,224,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8773/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=1,684,416,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8774/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,684,608,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8775/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,684,800,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8776/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,684,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8777/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,685,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8778/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,685,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8779/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,685,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8780/500000] + optim/total_grad_norm=1.678 + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=1,685,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8781/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,685,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8782/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,686,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8783/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,686,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8784/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,686,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8785/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,686,720,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8786/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=1,686,912,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8787/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,687,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8788/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,687,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8789/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,687,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8790/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,687,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8791/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,687,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8792/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,688,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8793/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,688,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8794/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,688,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8795/500000] + train/ActionNoiseL2Loss=0.0266 + throughput/total_tokens=1,688,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8796/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,688,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8797/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,689,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8798/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,689,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8799/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,689,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8800/500000] + optim/total_grad_norm=1.315 + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=1,689,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8801/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,689,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8802/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,689,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8803/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,690,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8804/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=1,690,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8805/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,690,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8806/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,690,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=8807/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,690,944,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8808/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,691,136,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8809/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,691,328,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8810/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,691,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=8811/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=1,691,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8812/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,691,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8813/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=1,692,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8814/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=1,692,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8815/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,692,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8816/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,692,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8817/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,692,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8818/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=1,693,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8819/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,693,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8820/500000] + optim/total_grad_norm=2.050 + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=1,693,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8821/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,693,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8822/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,693,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8823/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,694,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8824/500000] + train/ActionNoiseL2Loss=0.0306 + throughput/total_tokens=1,694,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8825/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,694,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8826/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,694,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8827/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,694,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8828/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,694,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8829/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,695,168,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8830/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,695,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8831/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,695,552,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8832/500000] + train/ActionNoiseL2Loss=0.1589 + throughput/total_tokens=1,695,744,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8833/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=1,695,936,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8834/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,696,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8835/500000] + train/ActionNoiseL2Loss=0.1228 + throughput/total_tokens=1,696,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8836/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,696,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8837/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,696,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8838/500000] + train/ActionNoiseL2Loss=0.1253 + throughput/total_tokens=1,696,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8839/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,697,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8840/500000] + optim/total_grad_norm=1.111 + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,697,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8841/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,697,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8842/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,697,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8843/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=1,697,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8844/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,698,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8845/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,698,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8846/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,698,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8847/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,698,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8848/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,698,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8849/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=1,699,008,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8850/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,699,200,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8851/500000] + train/ActionNoiseL2Loss=0.0262 + throughput/total_tokens=1,699,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8852/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,699,584,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8853/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=1,699,776,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8854/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,699,968,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8855/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,700,160,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8856/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,700,352,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8857/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,700,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8858/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,700,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8859/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=1,700,928,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8860/500000] + optim/total_grad_norm=1.002 + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,701,120,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8861/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=1,701,312,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8862/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,701,504,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8863/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,701,696,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8864/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,701,888,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8865/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,702,080,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8866/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,702,272,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8867/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,702,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8868/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,702,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8869/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,702,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8870/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=1,703,040,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8871/500000] + train/ActionNoiseL2Loss=0.0228 + throughput/total_tokens=1,703,232,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8872/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,703,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8873/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,703,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8874/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,703,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8875/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,704,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8876/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,704,192,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8877/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,704,384,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8878/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,704,576,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8879/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,704,768,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8880/500000] + optim/total_grad_norm=1.149 + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,704,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8881/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,705,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8882/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=1,705,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8883/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,705,536,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8884/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=1,705,728,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8885/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,705,920,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8886/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,706,112,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8887/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,706,304,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8888/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,706,496,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8889/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,706,688,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8890/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,706,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8891/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,707,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8892/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,707,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8893/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,707,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8894/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,707,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8895/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,707,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8896/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,708,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8897/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,708,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8898/500000] + train/ActionNoiseL2Loss=0.0249 + throughput/total_tokens=1,708,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8899/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,708,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8900/500000] + optim/total_grad_norm=1.151 + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,708,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8901/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,708,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8902/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,709,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8903/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=1,709,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8904/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,709,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8905/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,709,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8906/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,709,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8907/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=1,710,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8908/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,710,336,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8909/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=1,710,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8910/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,710,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8911/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,710,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8912/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,711,104,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8913/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,711,296,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8914/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=1,711,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8915/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,711,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8916/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,711,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8917/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,712,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8918/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=1,712,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8919/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,712,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=8920/500000] + optim/total_grad_norm=1.042 + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,712,640,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8921/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=1,712,832,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8922/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,713,024,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8923/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,713,216,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8924/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,713,408,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8925/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,713,600,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8926/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,713,792,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8927/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,713,984,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8928/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,714,176,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8929/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,714,368,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8930/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,714,560,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8931/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,714,752,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8932/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,714,944,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8933/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,715,136,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8934/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,715,328,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8935/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,715,520,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8936/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,715,712,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8937/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,715,904,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8938/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,716,096,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8939/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,716,288,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8940/500000] + optim/total_grad_norm=1.110 + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,716,480,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8941/500000] + train/ActionNoiseL2Loss=0.1101 + throughput/total_tokens=1,716,672,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8942/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,716,864,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=8943/500000] + train/ActionNoiseL2Loss=0.0968 + throughput/total_tokens=1,717,056,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8944/500000] + train/ActionNoiseL2Loss=0.0291 + throughput/total_tokens=1,717,248,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8945/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,717,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8946/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,717,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8947/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,717,824,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8948/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=1,718,016,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8949/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,718,208,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=8950/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,718,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8951/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,718,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8952/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,718,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8953/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,718,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8954/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,719,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8955/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,719,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8956/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,719,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8957/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,719,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8958/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,719,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8959/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,720,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8960/500000] + optim/total_grad_norm=1.371 + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,720,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=8961/500000] + train/ActionNoiseL2Loss=0.1429 + throughput/total_tokens=1,720,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8962/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,720,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8963/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,720,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8964/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,721,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8965/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,721,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8966/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,721,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8967/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=1,721,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8968/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,721,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8969/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,722,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=8970/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,722,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8971/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,722,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8972/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,722,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8973/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=1,722,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8974/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,723,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8975/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,723,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8976/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,723,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8977/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,723,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8978/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,723,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8979/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=1,723,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8980/500000] + optim/total_grad_norm=0.8865 + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,724,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=8981/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,724,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8982/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,724,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8983/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,724,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8984/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,724,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8985/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,725,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8986/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,725,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=8987/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,725,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8988/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,725,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8989/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=1,725,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8990/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,726,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=8991/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,726,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8992/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,726,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8993/500000] + train/ActionNoiseL2Loss=0.0199 + throughput/total_tokens=1,726,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=8994/500000] + train/ActionNoiseL2Loss=0.0291 + throughput/total_tokens=1,726,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8995/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=1,727,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8996/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=1,727,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8997/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,727,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8998/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=1,727,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=8999/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,727,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9000/500000] + optim/total_grad_norm=1.361 + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,728,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/07 [22:02:12] INFO | >> Saving config... checkpoint.py:608 +10/07 [22:02:43] INFO | >> Saving model state... checkpoint.py:796 +10/07 [22:03:57] INFO | >> Saving optim state... checkpoint.py:811 +10/07 [22:05:29] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=9001/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=1,728,192,000 + throughput/device/tokens_per_second=1,191 + throughput/device/batches_per_second=0.0497 +[step=9002/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,728,384,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9003/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,728,576,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=9004/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,728,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9005/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,728,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9006/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,729,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9007/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,729,344,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9008/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,729,536,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=9009/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=1,729,728,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=9010/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,729,920,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=9011/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,730,112,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=9012/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=1,730,304,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=9013/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,730,496,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9014/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,730,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9015/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,730,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9016/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,731,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9017/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,731,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9018/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,731,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9019/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,731,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9020/500000] + optim/total_grad_norm=1.597 + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,731,840,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9021/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,732,032,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9022/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=1,732,224,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9023/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,732,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9024/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,732,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9025/500000] + train/ActionNoiseL2Loss=0.0236 + throughput/total_tokens=1,732,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9026/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=1,732,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9027/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,733,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9028/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,733,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9029/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,733,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9030/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,733,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9031/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,733,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9032/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,734,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9033/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,734,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9034/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,734,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9035/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,734,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9036/500000] + train/ActionNoiseL2Loss=0.0979 + throughput/total_tokens=1,734,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9037/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,735,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9038/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,735,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9039/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,735,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9040/500000] + optim/total_grad_norm=0.7212 + train/ActionNoiseL2Loss=0.0237 + throughput/total_tokens=1,735,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9041/500000] + train/ActionNoiseL2Loss=0.0303 + throughput/total_tokens=1,735,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9042/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,736,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9043/500000] + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=1,736,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9044/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,736,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9045/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,736,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9046/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,736,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9047/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,737,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9048/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,737,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9049/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,737,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9050/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,737,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9051/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=1,737,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9052/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,737,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9053/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,738,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9054/500000] + train/ActionNoiseL2Loss=0.0237 + throughput/total_tokens=1,738,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9055/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,738,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9056/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,738,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9057/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,738,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9058/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,739,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9059/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=1,739,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9060/500000] + optim/total_grad_norm=0.9328 + train/ActionNoiseL2Loss=0.0200 + throughput/total_tokens=1,739,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9061/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,739,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9062/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,739,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9063/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=1,740,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9064/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,740,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9065/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,740,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9066/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,740,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9067/500000] + train/ActionNoiseL2Loss=0.1083 + throughput/total_tokens=1,740,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9068/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,741,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9069/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=1,741,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9070/500000] + train/ActionNoiseL2Loss=0.1085 + throughput/total_tokens=1,741,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9071/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,741,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9072/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,741,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9073/500000] + train/ActionNoiseL2Loss=0.0271 + throughput/total_tokens=1,742,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9074/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,742,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9075/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,742,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9076/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,742,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9077/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,742,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9078/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,742,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9079/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,743,168,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9080/500000] + optim/total_grad_norm=0.9988 + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=1,743,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9081/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=1,743,552,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9082/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,743,744,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9083/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,743,936,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9084/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=1,744,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9085/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,744,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9086/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,744,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9087/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,744,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9088/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,744,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9089/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,745,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9090/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,745,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9091/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,745,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9092/500000] + train/ActionNoiseL2Loss=0.1312 + throughput/total_tokens=1,745,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9093/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,745,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9094/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,746,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9095/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,746,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9096/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,746,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9097/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,746,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9098/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=1,746,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9099/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,747,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9100/500000] + optim/total_grad_norm=1.543 + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,747,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9101/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,747,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9102/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,747,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9103/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,747,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9104/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,747,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9105/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,748,160,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9106/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,748,352,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9107/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,748,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9108/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,748,736,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9109/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,748,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9110/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,749,120,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9111/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,749,312,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9112/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,749,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9113/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,749,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9114/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,749,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9115/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,750,080,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9116/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,750,272,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9117/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,750,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9118/500000] + train/ActionNoiseL2Loss=0.0224 + throughput/total_tokens=1,750,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9119/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,750,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9120/500000] + optim/total_grad_norm=1.058 + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,751,040,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9121/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,751,232,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9122/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,751,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9123/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,751,616,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9124/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,751,808,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9125/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,752,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9126/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,752,192,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9127/500000] + train/ActionNoiseL2Loss=0.0245 + throughput/total_tokens=1,752,384,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9128/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,752,576,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9129/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,752,768,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9130/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=1,752,960,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9131/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,753,152,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9132/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=1,753,344,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9133/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,753,536,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9134/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,753,728,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9135/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,753,920,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9136/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=1,754,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9137/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,754,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9138/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,754,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9139/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,754,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9140/500000] + optim/total_grad_norm=1.260 + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,754,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9141/500000] + train/ActionNoiseL2Loss=0.0262 + throughput/total_tokens=1,755,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9142/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=1,755,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9143/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,755,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9144/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,755,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9145/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,755,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9146/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,756,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9147/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,756,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9148/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,756,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9149/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=1,756,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9150/500000] + train/ActionNoiseL2Loss=0.0225 + throughput/total_tokens=1,756,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9151/500000] + train/ActionNoiseL2Loss=0.0204 + throughput/total_tokens=1,756,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9152/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,757,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9153/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,757,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9154/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,757,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9155/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,757,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9156/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=1,757,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9157/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,758,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9158/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=1,758,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9159/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,758,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9160/500000] + optim/total_grad_norm=1.357 + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=1,758,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9161/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,758,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9162/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,759,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9163/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,759,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9164/500000] + train/ActionNoiseL2Loss=0.0216 + throughput/total_tokens=1,759,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9165/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,759,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9166/500000] + train/ActionNoiseL2Loss=0.0178 + throughput/total_tokens=1,759,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9167/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,760,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9168/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,760,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9169/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,760,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9170/500000] + train/ActionNoiseL2Loss=0.1344 + throughput/total_tokens=1,760,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9171/500000] + train/ActionNoiseL2Loss=0.0246 + throughput/total_tokens=1,760,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9172/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=1,761,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9173/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,761,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9174/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,761,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9175/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=1,761,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9176/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,761,792,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9177/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,761,984,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9178/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,762,176,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9179/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,762,368,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9180/500000] + optim/total_grad_norm=1.302 + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,762,560,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9181/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=1,762,752,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9182/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=1,762,944,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9183/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,763,136,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9184/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,763,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9185/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,763,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9186/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,763,712,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9187/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,763,904,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9188/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,764,096,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9189/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,764,288,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9190/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,764,480,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9191/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=1,764,672,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9192/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,764,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9193/500000] + train/ActionNoiseL2Loss=0.0258 + throughput/total_tokens=1,765,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9194/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,765,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9195/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,765,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9196/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,765,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9197/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,765,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9198/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=1,766,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9199/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,766,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9200/500000] + optim/total_grad_norm=1.065 + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,766,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9201/500000] + train/ActionNoiseL2Loss=0.1384 + throughput/total_tokens=1,766,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9202/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,766,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9203/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,766,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9204/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,767,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9205/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,767,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9206/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,767,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9207/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,767,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9208/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,767,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9209/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,768,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9210/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,768,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9211/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,768,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9212/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,768,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9213/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=1,768,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9214/500000] + train/ActionNoiseL2Loss=0.0145 + throughput/total_tokens=1,769,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9215/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,769,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9216/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,769,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9217/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,769,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9218/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,769,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9219/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,770,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9220/500000] + optim/total_grad_norm=0.7313 + train/ActionNoiseL2Loss=0.0149 + throughput/total_tokens=1,770,240,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9221/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=1,770,432,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9222/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=1,770,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9223/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,770,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9224/500000] + train/ActionNoiseL2Loss=0.0300 + throughput/total_tokens=1,771,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9225/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,771,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9226/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,771,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9227/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,771,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9228/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,771,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9229/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,771,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9230/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,772,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9231/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,772,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9232/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,772,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9233/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,772,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9234/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,772,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9235/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=1,773,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9236/500000] + train/ActionNoiseL2Loss=0.0262 + throughput/total_tokens=1,773,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9237/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,773,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9238/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,773,696,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9239/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=1,773,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9240/500000] + optim/total_grad_norm=1.606 + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=1,774,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9241/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,774,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9242/500000] + train/ActionNoiseL2Loss=0.1071 + throughput/total_tokens=1,774,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9243/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=1,774,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9244/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=1,774,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9245/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,775,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9246/500000] + train/ActionNoiseL2Loss=0.0229 + throughput/total_tokens=1,775,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9247/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,775,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9248/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=1,775,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9249/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,775,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9250/500000] + train/ActionNoiseL2Loss=0.1121 + throughput/total_tokens=1,776,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9251/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,776,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9252/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=1,776,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9253/500000] + train/ActionNoiseL2Loss=0.0244 + throughput/total_tokens=1,776,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9254/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,776,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9255/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,776,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9256/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,777,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9257/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,777,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9258/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=1,777,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9259/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,777,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9260/500000] + optim/total_grad_norm=1.212 + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=1,777,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9261/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,778,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9262/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=1,778,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9263/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,778,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9264/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,778,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9265/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,778,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9266/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,779,072,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9267/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,779,264,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9268/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,779,456,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9269/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,779,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9270/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,779,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9271/500000] + train/ActionNoiseL2Loss=0.1211 + throughput/total_tokens=1,780,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9272/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,780,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9273/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,780,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9274/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,780,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9275/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=1,780,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9276/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,780,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9277/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,781,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9278/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,781,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9279/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,781,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9280/500000] + optim/total_grad_norm=1.140 + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,781,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9281/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,781,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9282/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,782,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9283/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,782,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9284/500000] + train/ActionNoiseL2Loss=0.0205 + throughput/total_tokens=1,782,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9285/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,782,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9286/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,782,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9287/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=1,783,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9288/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,783,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9289/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,783,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9290/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,783,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9291/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,783,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9292/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=1,784,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9293/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,784,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9294/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=1,784,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9295/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,784,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9296/500000] + train/ActionNoiseL2Loss=0.0292 + throughput/total_tokens=1,784,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9297/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,785,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9298/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,785,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9299/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=1,785,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9300/500000] + optim/total_grad_norm=1.080 + train/ActionNoiseL2Loss=0.0234 + throughput/total_tokens=1,785,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9301/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=1,785,792,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9302/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=1,785,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9303/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,786,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9304/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,786,368,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9305/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,786,560,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9306/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=1,786,752,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9307/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=1,786,944,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9308/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,787,136,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9309/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,787,328,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9310/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,787,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9311/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,787,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9312/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,787,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9313/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,788,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9314/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,788,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9315/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=1,788,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9316/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,788,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9317/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,788,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9318/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,789,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9319/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=1,789,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9320/500000] + optim/total_grad_norm=1.246 + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,789,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9321/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,789,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9322/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,789,824,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9323/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,790,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9324/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=1,790,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9325/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,790,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9326/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,790,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9327/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,790,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9328/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,790,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9329/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,791,168,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9330/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=1,791,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9331/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,791,552,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9332/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,791,744,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9333/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,791,936,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9334/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=1,792,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9335/500000] + train/ActionNoiseL2Loss=0.0242 + throughput/total_tokens=1,792,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9336/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,792,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9337/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,792,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9338/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,792,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9339/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,793,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9340/500000] + optim/total_grad_norm=1.416 + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,793,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9341/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,793,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9342/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,793,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9343/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,793,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9344/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,794,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9345/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,794,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9346/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,794,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9347/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,794,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9348/500000] + train/ActionNoiseL2Loss=0.0270 + throughput/total_tokens=1,794,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9349/500000] + train/ActionNoiseL2Loss=0.1102 + throughput/total_tokens=1,795,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9350/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,795,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9351/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,795,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9352/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,795,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9353/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,795,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9354/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,795,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9355/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,796,160,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9356/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,796,352,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9357/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=1,796,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9358/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,796,736,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9359/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,796,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9360/500000] + optim/total_grad_norm=1.230 + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,797,120,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9361/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,797,312,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9362/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,797,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9363/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,797,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9364/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,797,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9365/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,798,080,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9366/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=1,798,272,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9367/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=1,798,464,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9368/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,798,656,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9369/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,798,848,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9370/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,799,040,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9371/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=1,799,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9372/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,799,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9373/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,799,616,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9374/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=1,799,808,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9375/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,800,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9376/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,800,192,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9377/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,800,384,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9378/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,800,576,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9379/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,800,768,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9380/500000] + optim/total_grad_norm=1.107 + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,800,960,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9381/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,801,152,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9382/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=1,801,344,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9383/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,801,536,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9384/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,801,728,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9385/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,801,920,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9386/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,802,112,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9387/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=1,802,304,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9388/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,802,496,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9389/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,802,688,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9390/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,802,880,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9391/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,803,072,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9392/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,803,264,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9393/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,803,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9394/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,803,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9395/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,803,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9396/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,804,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9397/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,804,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9398/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,804,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9399/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,804,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9400/500000] + optim/total_grad_norm=0.9702 + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,804,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9401/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,804,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9402/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,805,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9403/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,805,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9404/500000] + train/ActionNoiseL2Loss=0.0224 + throughput/total_tokens=1,805,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9405/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,805,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9406/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,805,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9407/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,806,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9408/500000] + train/ActionNoiseL2Loss=0.1012 + throughput/total_tokens=1,806,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9409/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,806,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9410/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,806,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9411/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,806,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9412/500000] + train/ActionNoiseL2Loss=0.0196 + throughput/total_tokens=1,807,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9413/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,807,296,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9414/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,807,488,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9415/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,807,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9416/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,807,872,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9417/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,808,064,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9418/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,808,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9419/500000] + train/ActionNoiseL2Loss=0.0252 + throughput/total_tokens=1,808,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9420/500000] + optim/total_grad_norm=1.188 + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,808,640,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9421/500000] + train/ActionNoiseL2Loss=0.0293 + throughput/total_tokens=1,808,832,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9422/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,809,024,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9423/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,809,216,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9424/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,809,408,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9425/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,809,600,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9426/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,809,792,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9427/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,809,984,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9428/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,810,176,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9429/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,810,368,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9430/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,810,560,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9431/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,810,752,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9432/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,810,944,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9433/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,811,136,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9434/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,811,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9435/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,811,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9436/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,811,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9437/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,811,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9438/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,812,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9439/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=1,812,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9440/500000] + optim/total_grad_norm=1.411 + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,812,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9441/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,812,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9442/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,812,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9443/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,813,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9444/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,813,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9445/500000] + train/ActionNoiseL2Loss=0.0210 + throughput/total_tokens=1,813,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9446/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=1,813,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9447/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,813,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9448/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,814,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9449/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=1,814,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9450/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,814,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9451/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,814,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9452/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,814,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9453/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,814,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9454/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,815,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9455/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,815,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9456/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,815,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9457/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,815,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9458/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=1,815,936,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9459/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,816,128,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9460/500000] + optim/total_grad_norm=1.293 + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,816,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9461/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,816,512,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9462/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=1,816,704,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9463/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,816,896,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9464/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,817,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9465/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,817,280,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9466/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,817,472,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9467/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=1,817,664,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9468/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,817,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9469/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,818,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9470/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,818,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9471/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=1,818,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9472/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,818,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9473/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=1,818,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9474/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,819,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9475/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,819,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9476/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=1,819,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9477/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,819,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9478/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=1,819,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9479/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,819,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9480/500000] + optim/total_grad_norm=1.390 + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,820,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9481/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,820,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9482/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,820,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9483/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,820,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9484/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,820,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9485/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,821,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9486/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,821,312,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9487/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,821,504,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9488/500000] + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=1,821,696,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9489/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,821,888,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9490/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,822,080,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9491/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,822,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9492/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,822,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9493/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,822,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9494/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,822,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9495/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,823,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9496/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,823,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9497/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,823,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9498/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,823,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9499/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=1,823,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9500/500000] + optim/total_grad_norm=1.175 + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,824,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/08 [00:59:35] INFO | >> Saving config... checkpoint.py:608 +10/08 [01:00:30] INFO | >> Saving model state... checkpoint.py:796 +10/08 [01:01:46] INFO | >> Saving optim state... checkpoint.py:811 +10/08 [01:03:18] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=9501/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,824,192,000 + throughput/device/tokens_per_second=1,193 + throughput/device/batches_per_second=0.0497 +[step=9502/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,824,384,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9503/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,824,576,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=9504/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,824,768,000 + throughput/device/tokens_per_second=1,165 + throughput/device/batches_per_second=0.0486 +[step=9505/500000] + train/ActionNoiseL2Loss=0.1024 + throughput/total_tokens=1,824,960,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=9506/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,825,152,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=9507/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,825,344,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0485 +[step=9508/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,825,536,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=9509/500000] + train/ActionNoiseL2Loss=0.1331 + throughput/total_tokens=1,825,728,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=9510/500000] + train/ActionNoiseL2Loss=0.0228 + throughput/total_tokens=1,825,920,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9511/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=1,826,112,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9512/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,826,304,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9513/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=1,826,496,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9514/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,826,688,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9515/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,826,880,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9516/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,827,072,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9517/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=1,827,264,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9518/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,827,456,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9519/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,827,648,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9520/500000] + optim/total_grad_norm=1.712 + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,827,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9521/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=1,828,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9522/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=1,828,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9523/500000] + train/ActionNoiseL2Loss=0.0190 + throughput/total_tokens=1,828,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9524/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,828,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9525/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,828,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9526/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,828,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9527/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,829,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9528/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,829,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9529/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=1,829,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9530/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,829,760,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9531/500000] + train/ActionNoiseL2Loss=0.0211 + throughput/total_tokens=1,829,952,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9532/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=1,830,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9533/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=1,830,336,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9534/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,830,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9535/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=1,830,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9536/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,830,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9537/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=1,831,104,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9538/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,831,296,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9539/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,831,488,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9540/500000] + optim/total_grad_norm=1.703 + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,831,680,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9541/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,831,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9542/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,832,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9543/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,832,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9544/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=1,832,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9545/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,832,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9546/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,832,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9547/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,833,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9548/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,833,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9549/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=1,833,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9550/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,833,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9551/500000] + train/ActionNoiseL2Loss=0.0306 + throughput/total_tokens=1,833,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9552/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,833,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9553/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,834,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9554/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,834,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9555/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,834,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9556/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,834,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9557/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,834,944,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9558/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,835,136,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9559/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,835,328,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9560/500000] + optim/total_grad_norm=1.197 + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=1,835,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9561/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,835,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9562/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,835,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9563/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,836,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9564/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=1,836,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9565/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,836,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9566/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,836,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9567/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,836,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9568/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,837,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9569/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,837,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9570/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,837,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9571/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,837,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9572/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=1,837,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9573/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,838,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9574/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,838,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9575/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,838,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9576/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,838,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9577/500000] + train/ActionNoiseL2Loss=0.0237 + throughput/total_tokens=1,838,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9578/500000] + train/ActionNoiseL2Loss=0.0197 + throughput/total_tokens=1,838,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9579/500000] + train/ActionNoiseL2Loss=0.0178 + throughput/total_tokens=1,839,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9580/500000] + optim/total_grad_norm=1.344 + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,839,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9581/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,839,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9582/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,839,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9583/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=1,839,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9584/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=1,840,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9585/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,840,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9586/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,840,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9587/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,840,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9588/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,840,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9589/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,841,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9590/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,841,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9591/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=1,841,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9592/500000] + train/ActionNoiseL2Loss=0.0312 + throughput/total_tokens=1,841,664,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9593/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,841,856,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9594/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,842,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9595/500000] + train/ActionNoiseL2Loss=0.0262 + throughput/total_tokens=1,842,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9596/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,842,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9597/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=1,842,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9598/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,842,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9599/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=1,843,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9600/500000] + optim/total_grad_norm=1.344 + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,843,200,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9601/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,843,392,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=9602/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,843,584,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=9603/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=1,843,776,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=9604/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,843,968,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=9605/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=1,844,160,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9606/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,844,352,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9607/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,844,544,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9608/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,844,736,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9609/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,844,928,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9610/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,845,120,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,467 +[step=9611/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,845,312,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9612/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,845,504,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9613/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,845,696,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9614/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,845,888,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9615/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=1,846,080,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9616/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,846,272,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9617/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,846,464,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9618/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,846,656,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9619/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,846,848,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9620/500000] + optim/total_grad_norm=1.300 + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,847,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9621/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,847,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9622/500000] + train/ActionNoiseL2Loss=0.1171 + throughput/total_tokens=1,847,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9623/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,847,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9624/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,847,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9625/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,848,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9626/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=1,848,192,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9627/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,848,384,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9628/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,848,576,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9629/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=1,848,768,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9630/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,848,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9631/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,849,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9632/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,849,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9633/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,849,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9634/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,849,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9635/500000] + train/ActionNoiseL2Loss=0.0278 + throughput/total_tokens=1,849,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9636/500000] + train/ActionNoiseL2Loss=0.0269 + throughput/total_tokens=1,850,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9637/500000] + train/ActionNoiseL2Loss=0.0195 + throughput/total_tokens=1,850,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9638/500000] + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=1,850,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9639/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=1,850,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9640/500000] + optim/total_grad_norm=1.589 + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=1,850,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9641/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,851,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9642/500000] + train/ActionNoiseL2Loss=0.1131 + throughput/total_tokens=1,851,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9643/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,851,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9644/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,851,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9645/500000] + train/ActionNoiseL2Loss=0.0189 + throughput/total_tokens=1,851,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9646/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,852,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9647/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,852,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9648/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,852,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9649/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=1,852,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9650/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,852,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9651/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,852,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9652/500000] + train/ActionNoiseL2Loss=0.0214 + throughput/total_tokens=1,853,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9653/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=1,853,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9654/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,853,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9655/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,853,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9656/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,853,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9657/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,854,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9658/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=1,854,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9659/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,854,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9660/500000] + optim/total_grad_norm=1.510 + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=1,854,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9661/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,854,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9662/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,855,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9663/500000] + train/ActionNoiseL2Loss=0.1012 + throughput/total_tokens=1,855,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9664/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,855,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9665/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,855,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9666/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,855,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9667/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,856,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9668/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,856,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9669/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,856,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9670/500000] + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=1,856,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9671/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,856,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9672/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,857,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9673/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,857,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9674/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,857,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9675/500000] + train/ActionNoiseL2Loss=0.0244 + throughput/total_tokens=1,857,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9676/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,857,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9677/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,857,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9678/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,858,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9679/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,858,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9680/500000] + optim/total_grad_norm=0.9323 + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,858,560,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9681/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=1,858,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9682/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,858,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9683/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,859,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9684/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,859,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9685/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,859,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9686/500000] + train/ActionNoiseL2Loss=0.0270 + throughput/total_tokens=1,859,712,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9687/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,859,904,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9688/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=1,860,096,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9689/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,860,288,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9690/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,860,480,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9691/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,860,672,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9692/500000] + train/ActionNoiseL2Loss=0.0275 + throughput/total_tokens=1,860,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9693/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,861,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9694/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,861,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9695/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,861,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9696/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,861,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9697/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,861,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9698/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,862,016,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9699/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,862,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9700/500000] + optim/total_grad_norm=1.967 + train/ActionNoiseL2Loss=0.1144 + throughput/total_tokens=1,862,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9701/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,862,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9702/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,862,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9703/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=1,862,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9704/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,863,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9705/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,863,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9706/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,863,552,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9707/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,863,744,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9708/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,863,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9709/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,864,128,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9710/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=1,864,320,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9711/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,864,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=9712/500000] + train/ActionNoiseL2Loss=0.1196 + throughput/total_tokens=1,864,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=9713/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,864,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=9714/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,865,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9715/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,865,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9716/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,865,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9717/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,865,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9718/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,865,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=9719/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,866,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9720/500000] + optim/total_grad_norm=0.8367 + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=1,866,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9721/500000] + train/ActionNoiseL2Loss=0.0929 + throughput/total_tokens=1,866,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9722/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,866,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9723/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,866,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9724/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,867,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9725/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,867,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9726/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,867,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9727/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,867,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9728/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,867,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9729/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,867,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9730/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,868,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9731/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,868,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9732/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=1,868,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9733/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,868,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9734/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,868,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9735/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,869,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9736/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=1,869,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9737/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,869,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9738/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,869,696,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9739/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=1,869,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9740/500000] + optim/total_grad_norm=0.9708 + train/ActionNoiseL2Loss=0.0185 + throughput/total_tokens=1,870,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9741/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,870,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9742/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,870,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9743/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=1,870,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9744/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,870,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9745/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,871,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9746/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,871,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9747/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,871,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9748/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,871,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9749/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,871,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9750/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,872,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9751/500000] + train/ActionNoiseL2Loss=0.1236 + throughput/total_tokens=1,872,192,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9752/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,872,384,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9753/500000] + train/ActionNoiseL2Loss=0.1601 + throughput/total_tokens=1,872,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9754/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,872,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9755/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,872,960,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9756/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=1,873,152,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9757/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,873,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9758/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,873,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9759/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,873,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9760/500000] + optim/total_grad_norm=1.460 + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,873,920,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9761/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,874,112,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9762/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=1,874,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9763/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,874,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9764/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,874,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9765/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,874,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9766/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,875,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9767/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,875,264,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9768/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,875,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9769/500000] + train/ActionNoiseL2Loss=0.0240 + throughput/total_tokens=1,875,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9770/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,875,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9771/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,876,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9772/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,876,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9773/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,876,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9774/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,876,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9775/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,876,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9776/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,876,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9777/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=1,877,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9778/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,877,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9779/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,877,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9780/500000] + optim/total_grad_norm=1.264 + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,877,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9781/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,877,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9782/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=1,878,144,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9783/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,878,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9784/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,878,528,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9785/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,878,720,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9786/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,878,912,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9787/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,879,104,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9788/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=1,879,296,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9789/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,879,488,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9790/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,879,680,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9791/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,879,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9792/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,880,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9793/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=1,880,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9794/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=1,880,448,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9795/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,880,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9796/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,880,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9797/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,881,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9798/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,881,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9799/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,881,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9800/500000] + optim/total_grad_norm=1.423 + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,881,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9801/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,881,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9802/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,881,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9803/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,882,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9804/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,882,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9805/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,882,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9806/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,882,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9807/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,882,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9808/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,883,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9809/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,883,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9810/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,883,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9811/500000] + train/ActionNoiseL2Loss=0.0312 + throughput/total_tokens=1,883,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9812/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=1,883,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9813/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,884,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9814/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,884,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9815/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,884,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9816/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,884,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9817/500000] + train/ActionNoiseL2Loss=0.0233 + throughput/total_tokens=1,884,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9818/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,885,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9819/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=1,885,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9820/500000] + optim/total_grad_norm=1.095 + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,885,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9821/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,885,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9822/500000] + train/ActionNoiseL2Loss=0.1543 + throughput/total_tokens=1,885,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9823/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=1,886,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9824/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,886,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9825/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,886,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9826/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,886,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9827/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,886,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9828/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,886,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9829/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,887,168,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9830/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,887,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9831/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,887,552,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9832/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,887,744,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9833/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,887,936,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9834/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,888,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9835/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,888,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9836/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,888,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9837/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,888,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9838/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,888,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9839/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,889,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9840/500000] + optim/total_grad_norm=1.487 + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,889,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9841/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,889,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9842/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,889,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9843/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,889,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9844/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=1,890,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9845/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,890,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9846/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,890,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9847/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,890,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9848/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,890,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9849/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=1,891,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9850/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,891,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9851/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,891,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9852/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,891,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9853/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,891,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9854/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,891,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9855/500000] + train/ActionNoiseL2Loss=0.0306 + throughput/total_tokens=1,892,160,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9856/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=1,892,352,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9857/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,892,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9858/500000] + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=1,892,736,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9859/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,892,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9860/500000] + optim/total_grad_norm=0.9671 + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,893,120,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9861/500000] + train/ActionNoiseL2Loss=0.0212 + throughput/total_tokens=1,893,312,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9862/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,893,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9863/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,893,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9864/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,893,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9865/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,894,080,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9866/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,894,272,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9867/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,894,464,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9868/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,894,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9869/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,894,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=9870/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,895,040,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9871/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,895,232,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9872/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,895,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9873/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,895,616,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9874/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,895,808,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9875/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,896,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9876/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,896,192,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9877/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,896,384,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9878/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,896,576,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9879/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,896,768,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9880/500000] + optim/total_grad_norm=1.345 + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,896,960,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9881/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=1,897,152,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9882/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,897,344,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9883/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,897,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9884/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,897,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9885/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,897,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9886/500000] + train/ActionNoiseL2Loss=0.0303 + throughput/total_tokens=1,898,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9887/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,898,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9888/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=1,898,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9889/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,898,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9890/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,898,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9891/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,899,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9892/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,899,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9893/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,899,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9894/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,899,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9895/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,899,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9896/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,900,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9897/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,900,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9898/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,900,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9899/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=1,900,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9900/500000] + optim/total_grad_norm=1.029 + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,900,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9901/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,900,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9902/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,901,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=9903/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,901,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9904/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,901,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9905/500000] + train/ActionNoiseL2Loss=0.0247 + throughput/total_tokens=1,901,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9906/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,901,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9907/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=1,902,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9908/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,902,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9909/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,902,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9910/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,902,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9911/500000] + train/ActionNoiseL2Loss=0.0233 + throughput/total_tokens=1,902,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9912/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=1,903,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9913/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,903,296,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9914/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,903,488,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9915/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,903,680,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9916/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,903,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9917/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=1,904,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9918/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,904,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9919/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,904,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9920/500000] + optim/total_grad_norm=1.114 + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,904,640,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9921/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,904,832,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9922/500000] + train/ActionNoiseL2Loss=0.0277 + throughput/total_tokens=1,905,024,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9923/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,905,216,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9924/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,905,408,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9925/500000] + train/ActionNoiseL2Loss=0.1243 + throughput/total_tokens=1,905,600,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9926/500000] + train/ActionNoiseL2Loss=0.0192 + throughput/total_tokens=1,905,792,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9927/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,905,984,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9928/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,906,176,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9929/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,906,368,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9930/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,906,560,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9931/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,906,752,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9932/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,906,944,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9933/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,907,136,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9934/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=1,907,328,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9935/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,907,520,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9936/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,907,712,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9937/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,907,904,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9938/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,908,096,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9939/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,908,288,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9940/500000] + optim/total_grad_norm=0.8410 + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,908,480,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=9941/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,908,672,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=9942/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,908,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9943/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,909,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9944/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,909,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9945/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,909,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9946/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=1,909,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9947/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,909,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=9948/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,910,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9949/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,910,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9950/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,910,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9951/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,910,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9952/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,910,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9953/500000] + train/ActionNoiseL2Loss=0.0242 + throughput/total_tokens=1,910,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9954/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,911,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9955/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,911,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9956/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,911,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9957/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,911,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9958/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,911,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9959/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,912,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9960/500000] + optim/total_grad_norm=1.098 + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,912,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=9961/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=1,912,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9962/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,912,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9963/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,912,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9964/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,913,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9965/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,913,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9966/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=1,913,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9967/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,913,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9968/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,913,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9969/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,914,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=9970/500000] + train/ActionNoiseL2Loss=0.0202 + throughput/total_tokens=1,914,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9971/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,914,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9972/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,914,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9973/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,914,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=9974/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,915,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9975/500000] + train/ActionNoiseL2Loss=0.1127 + throughput/total_tokens=1,915,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9976/500000] + train/ActionNoiseL2Loss=0.0252 + throughput/total_tokens=1,915,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9977/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,915,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9978/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,915,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9979/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,915,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9980/500000] + optim/total_grad_norm=1.037 + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,916,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9981/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,916,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9982/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,916,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9983/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,916,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9984/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,916,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9985/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,917,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9986/500000] + train/ActionNoiseL2Loss=0.0201 + throughput/total_tokens=1,917,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9987/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,917,504,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9988/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,917,696,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9989/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,917,888,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9990/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=1,918,080,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=9991/500000] + train/ActionNoiseL2Loss=0.0197 + throughput/total_tokens=1,918,272,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9992/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,918,464,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9993/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,918,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9994/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,918,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9995/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=1,919,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9996/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,919,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9997/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,919,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9998/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,919,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=9999/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,919,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10000/500000] + optim/total_grad_norm=1.129 + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,920,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/08 [03:57:48] INFO | >> Saving config... checkpoint.py:608 +10/08 [03:58:22] INFO | >> Saving model state... checkpoint.py:796 +10/08 [03:59:38] INFO | >> Saving optim state... checkpoint.py:811 +10/08 [04:01:10] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=10001/500000] + train/ActionNoiseL2Loss=0.0189 + throughput/total_tokens=1,920,192,000 + throughput/device/tokens_per_second=1,189 + throughput/device/batches_per_second=0.0496 +[step=10002/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,920,384,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10003/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,920,576,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=10004/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,920,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10005/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,920,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10006/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,921,152,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10007/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,921,344,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10008/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,921,536,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=10009/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,921,728,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10010/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,921,920,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=10011/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=1,922,112,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10012/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,922,304,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10013/500000] + train/ActionNoiseL2Loss=0.0223 + throughput/total_tokens=1,922,496,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10014/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,922,688,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10015/500000] + train/ActionNoiseL2Loss=0.0306 + throughput/total_tokens=1,922,880,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10016/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,923,072,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10017/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,923,264,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10018/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,923,456,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10019/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,923,648,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10020/500000] + optim/total_grad_norm=1.130 + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,923,840,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=10021/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,924,032,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10022/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=1,924,224,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10023/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=1,924,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10024/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,924,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10025/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,924,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10026/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=1,924,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10027/500000] + train/ActionNoiseL2Loss=0.0164 + throughput/total_tokens=1,925,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10028/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,925,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10029/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,925,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10030/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,925,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10031/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,925,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10032/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,926,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10033/500000] + train/ActionNoiseL2Loss=0.0177 + throughput/total_tokens=1,926,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10034/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,926,528,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10035/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,926,720,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10036/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,926,912,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10037/500000] + train/ActionNoiseL2Loss=0.1276 + throughput/total_tokens=1,927,104,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10038/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=1,927,296,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10039/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,927,488,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10040/500000] + optim/total_grad_norm=1.299 + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,927,680,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10041/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,927,872,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10042/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=1,928,064,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10043/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,928,256,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10044/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,928,448,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10045/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,928,640,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10046/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=1,928,832,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10047/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,929,024,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10048/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=1,929,216,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10049/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,929,408,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10050/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,929,600,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10051/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,929,792,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10052/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=1,929,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10053/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=1,930,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10054/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,930,368,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10055/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,930,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10056/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,930,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10057/500000] + train/ActionNoiseL2Loss=0.0191 + throughput/total_tokens=1,930,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10058/500000] + train/ActionNoiseL2Loss=0.0135 + throughput/total_tokens=1,931,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10059/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,931,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10060/500000] + optim/total_grad_norm=1.109 + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,931,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10061/500000] + train/ActionNoiseL2Loss=0.1667 + throughput/total_tokens=1,931,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10062/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,931,904,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10063/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=1,932,096,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10064/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=1,932,288,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10065/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,932,480,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10066/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,932,672,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10067/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,932,864,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10068/500000] + train/ActionNoiseL2Loss=0.0224 + throughput/total_tokens=1,933,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10069/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=1,933,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10070/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=1,933,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10071/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,933,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10072/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,933,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10073/500000] + train/ActionNoiseL2Loss=0.0200 + throughput/total_tokens=1,934,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10074/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,934,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10075/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=1,934,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10076/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=1,934,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10077/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,934,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10078/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=1,934,976,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10079/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,935,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10080/500000] + optim/total_grad_norm=1.229 + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,935,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10081/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,935,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10082/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,935,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10083/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,935,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10084/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,936,128,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10085/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,936,320,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10086/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=1,936,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10087/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,936,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10088/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,936,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10089/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,937,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10090/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,937,280,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10091/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,937,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10092/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,937,664,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10093/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,937,856,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10094/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,938,048,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10095/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=1,938,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10096/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,938,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10097/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,938,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10098/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,938,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10099/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=1,939,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10100/500000] + optim/total_grad_norm=0.9410 + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,939,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10101/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,939,392,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10102/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,939,584,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10103/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,939,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10104/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,939,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10105/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,940,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10106/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,940,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10107/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,940,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10108/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,940,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10109/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=1,940,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10110/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,941,120,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10111/500000] + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=1,941,312,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10112/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,941,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10113/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,941,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10114/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,941,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10115/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,942,080,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10116/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,942,272,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10117/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,942,464,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10118/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,942,656,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10119/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,942,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10120/500000] + optim/total_grad_norm=1.164 + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,943,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10121/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,943,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10122/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=1,943,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10123/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,943,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10124/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=1,943,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10125/500000] + train/ActionNoiseL2Loss=0.0265 + throughput/total_tokens=1,944,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10126/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,944,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10127/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,944,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10128/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,944,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10129/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,944,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10130/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=1,944,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10131/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,945,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10132/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,945,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10133/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,945,536,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10134/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,945,728,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10135/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,945,920,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10136/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,946,112,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10137/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,946,304,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10138/500000] + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=1,946,496,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10139/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,946,688,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10140/500000] + optim/total_grad_norm=0.9374 + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,946,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10141/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=1,947,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10142/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,947,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10143/500000] + train/ActionNoiseL2Loss=0.0243 + throughput/total_tokens=1,947,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10144/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,947,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10145/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,947,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10146/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,948,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10147/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,948,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10148/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,948,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10149/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,948,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10150/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,948,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10151/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,948,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10152/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=1,949,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10153/500000] + train/ActionNoiseL2Loss=0.0270 + throughput/total_tokens=1,949,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10154/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,949,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10155/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,949,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10156/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=1,949,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10157/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,950,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10158/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,950,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10159/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,950,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10160/500000] + optim/total_grad_norm=0.9746 + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,950,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10161/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,950,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10162/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,951,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10163/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=1,951,296,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10164/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,951,488,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10165/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,951,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10166/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,951,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10167/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,952,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10168/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,952,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10169/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,952,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10170/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,952,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10171/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,952,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10172/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,953,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10173/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,953,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10174/500000] + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=1,953,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10175/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,953,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10176/500000] + train/ActionNoiseL2Loss=0.1119 + throughput/total_tokens=1,953,792,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10177/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,953,984,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10178/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=1,954,176,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10179/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,954,368,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10180/500000] + optim/total_grad_norm=0.9883 + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,954,560,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10181/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,954,752,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10182/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=1,954,944,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10183/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,955,136,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10184/500000] + train/ActionNoiseL2Loss=0.0187 + throughput/total_tokens=1,955,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10185/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,955,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10186/500000] + train/ActionNoiseL2Loss=0.0171 + throughput/total_tokens=1,955,712,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10187/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,955,904,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10188/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,956,096,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10189/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,956,288,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10190/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,956,480,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10191/500000] + train/ActionNoiseL2Loss=0.0224 + throughput/total_tokens=1,956,672,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10192/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,956,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10193/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,957,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10194/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,957,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10195/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,957,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10196/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,957,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10197/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=1,957,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10198/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,958,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10199/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,958,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10200/500000] + optim/total_grad_norm=1.161 + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,958,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10201/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,958,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10202/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,958,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10203/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,958,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10204/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,959,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10205/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,959,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10206/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,959,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10207/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,959,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10208/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=1,959,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10209/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,960,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10210/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=1,960,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10211/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,960,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10212/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,960,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10213/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=1,960,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10214/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,961,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10215/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,961,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10216/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=1,961,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10217/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,961,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10218/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,961,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10219/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,962,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10220/500000] + optim/total_grad_norm=1.160 + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,962,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10221/500000] + train/ActionNoiseL2Loss=0.0271 + throughput/total_tokens=1,962,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10222/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,962,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10223/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,962,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10224/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,963,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10225/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,963,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10226/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,963,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10227/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,963,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10228/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,963,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10229/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,963,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10230/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=1,964,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10231/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,964,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10232/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,964,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10233/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,964,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10234/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=1,964,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10235/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,965,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10236/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,965,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10237/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,965,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10238/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,965,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10239/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,965,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10240/500000] + optim/total_grad_norm=0.9461 + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,966,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10241/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,966,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10242/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,966,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10243/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,966,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10244/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,966,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10245/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,967,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10246/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=1,967,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10247/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,967,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10248/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,967,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10249/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,967,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10250/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,968,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10251/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,968,192,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10252/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,968,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10253/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,968,576,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10254/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,968,768,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10255/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,968,960,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10256/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,969,152,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10257/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,969,344,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10258/500000] + train/ActionNoiseL2Loss=0.0235 + throughput/total_tokens=1,969,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10259/500000] + train/ActionNoiseL2Loss=0.0252 + throughput/total_tokens=1,969,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10260/500000] + optim/total_grad_norm=0.8340 + train/ActionNoiseL2Loss=0.0226 + throughput/total_tokens=1,969,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10261/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,970,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10262/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,970,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10263/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,970,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10264/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,970,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10265/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=1,970,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10266/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,971,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10267/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,971,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10268/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,971,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10269/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=1,971,648,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10270/500000] + train/ActionNoiseL2Loss=0.0277 + throughput/total_tokens=1,971,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10271/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,972,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10272/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,972,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10273/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,972,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10274/500000] + train/ActionNoiseL2Loss=0.0291 + throughput/total_tokens=1,972,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10275/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,972,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10276/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,972,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10277/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,973,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10278/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,973,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10279/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,973,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10280/500000] + optim/total_grad_norm=0.9998 + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,973,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10281/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,973,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10282/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,974,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10283/500000] + train/ActionNoiseL2Loss=0.0155 + throughput/total_tokens=1,974,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10284/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,974,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10285/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,974,720,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10286/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,974,912,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10287/500000] + train/ActionNoiseL2Loss=0.1079 + throughput/total_tokens=1,975,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10288/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=1,975,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10289/500000] + train/ActionNoiseL2Loss=0.0218 + throughput/total_tokens=1,975,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10290/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,975,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10291/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,975,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10292/500000] + train/ActionNoiseL2Loss=0.1752 + throughput/total_tokens=1,976,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10293/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,976,256,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10294/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,976,448,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10295/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,976,640,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10296/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,976,832,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10297/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,977,024,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10298/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,977,216,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10299/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,977,408,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10300/500000] + optim/total_grad_norm=1.301 + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,977,600,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10301/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,977,792,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10302/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,977,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10303/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=1,978,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10304/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,978,368,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10305/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,978,560,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10306/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,978,752,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10307/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,978,944,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10308/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=1,979,136,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10309/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,979,328,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10310/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,979,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10311/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=1,979,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10312/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,979,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10313/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=1,980,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10314/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,980,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10315/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,980,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10316/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,980,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10317/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,980,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10318/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,981,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10319/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,981,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10320/500000] + optim/total_grad_norm=1.683 + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,981,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10321/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=1,981,632,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10322/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,981,824,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10323/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,982,016,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10324/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,982,208,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10325/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,982,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10326/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,982,592,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10327/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,982,784,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10328/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,982,976,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10329/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,983,168,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10330/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=1,983,360,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10331/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,983,552,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10332/500000] + train/ActionNoiseL2Loss=0.0179 + throughput/total_tokens=1,983,744,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10333/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,983,936,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10334/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=1,984,128,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10335/500000] + train/ActionNoiseL2Loss=0.0277 + throughput/total_tokens=1,984,320,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10336/500000] + train/ActionNoiseL2Loss=0.0212 + throughput/total_tokens=1,984,512,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10337/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,984,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10338/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,984,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10339/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,985,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10340/500000] + optim/total_grad_norm=1.031 + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,985,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10341/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=1,985,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10342/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,985,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10343/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=1,985,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10344/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,986,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10345/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,986,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10346/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,986,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10347/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,986,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10348/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=1,986,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10349/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=1,987,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10350/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,987,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10351/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=1,987,392,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10352/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,987,584,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10353/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=1,987,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10354/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,987,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10355/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,988,160,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10356/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,988,352,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10357/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=1,988,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10358/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,988,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10359/500000] + train/ActionNoiseL2Loss=0.1221 + throughput/total_tokens=1,988,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10360/500000] + optim/total_grad_norm=1.011 + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,989,120,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10361/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,989,312,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10362/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,989,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10363/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,989,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10364/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,989,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10365/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,990,080,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10366/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=1,990,272,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10367/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,990,464,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10368/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=1,990,656,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10369/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=1,990,848,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10370/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=1,991,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10371/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,991,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10372/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,991,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10373/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,991,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10374/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,991,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10375/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,992,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10376/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,992,192,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10377/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,992,384,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10378/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,992,576,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10379/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=1,992,768,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10380/500000] + optim/total_grad_norm=1.635 + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,992,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10381/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,993,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10382/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,993,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10383/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,993,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10384/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,993,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10385/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=1,993,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10386/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,994,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10387/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,994,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10388/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,994,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10389/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,994,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10390/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,994,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10391/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,995,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10392/500000] + train/ActionNoiseL2Loss=0.0197 + throughput/total_tokens=1,995,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10393/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,995,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10394/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,995,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10395/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,995,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10396/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,996,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10397/500000] + train/ActionNoiseL2Loss=0.0145 + throughput/total_tokens=1,996,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10398/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,996,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10399/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,996,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10400/500000] + optim/total_grad_norm=1.232 + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,996,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10401/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,996,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10402/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,997,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10403/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,997,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10404/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,997,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10405/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,997,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10406/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,997,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10407/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,998,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10408/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,998,336,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10409/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,998,528,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10410/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=1,998,720,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10411/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,998,912,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10412/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,999,104,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10413/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,999,296,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10414/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=1,999,488,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10415/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,999,680,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10416/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,999,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10417/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=2,000,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10418/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,000,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10419/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=2,000,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10420/500000] + optim/total_grad_norm=0.9981 + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=2,000,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10421/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=2,000,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10422/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=2,001,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10423/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=2,001,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10424/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=2,001,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10425/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=2,001,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10426/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=2,001,792,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10427/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=2,001,984,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10428/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=2,002,176,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10429/500000] + train/ActionNoiseL2Loss=0.0139 + throughput/total_tokens=2,002,368,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10430/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,002,560,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10431/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=2,002,752,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10432/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=2,002,944,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10433/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=2,003,136,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10434/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=2,003,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10435/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=2,003,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10436/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=2,003,712,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10437/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=2,003,904,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10438/500000] + train/ActionNoiseL2Loss=0.0255 + throughput/total_tokens=2,004,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10439/500000] + train/ActionNoiseL2Loss=0.1107 + throughput/total_tokens=2,004,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10440/500000] + optim/total_grad_norm=1.212 + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=2,004,480,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10441/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=2,004,672,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10442/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=2,004,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10443/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=2,005,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10444/500000] + train/ActionNoiseL2Loss=0.0291 + throughput/total_tokens=2,005,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10445/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=2,005,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10446/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=2,005,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10447/500000] + train/ActionNoiseL2Loss=0.0968 + throughput/total_tokens=2,005,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10448/500000] + train/ActionNoiseL2Loss=0.0245 + throughput/total_tokens=2,006,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10449/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=2,006,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10450/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=2,006,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10451/500000] + train/ActionNoiseL2Loss=0.1125 + throughput/total_tokens=2,006,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10452/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=2,006,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10453/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=2,006,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10454/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=2,007,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10455/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=2,007,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10456/500000] + train/ActionNoiseL2Loss=0.0286 + throughput/total_tokens=2,007,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10457/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=2,007,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10458/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=2,007,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10459/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=2,008,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10460/500000] + optim/total_grad_norm=2.123 + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=2,008,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10461/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=2,008,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10462/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=2,008,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10463/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=2,008,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10464/500000] + train/ActionNoiseL2Loss=0.1140 + throughput/total_tokens=2,009,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10465/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,009,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10466/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=2,009,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10467/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=2,009,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10468/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,009,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10469/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=2,010,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10470/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=2,010,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10471/500000] + train/ActionNoiseL2Loss=0.0242 + throughput/total_tokens=2,010,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10472/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=2,010,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10473/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=2,010,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10474/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=2,011,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10475/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=2,011,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10476/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=2,011,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10477/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=2,011,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10478/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,011,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10479/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=2,011,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10480/500000] + optim/total_grad_norm=1.197 + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=2,012,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10481/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=2,012,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10482/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=2,012,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10483/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,012,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10484/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=2,012,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10485/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=2,013,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10486/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=2,013,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10487/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=2,013,504,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10488/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=2,013,696,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10489/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=2,013,888,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10490/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,014,080,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10491/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=2,014,272,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10492/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=2,014,464,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10493/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=2,014,656,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10494/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=2,014,848,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10495/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=2,015,040,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10496/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,015,232,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10497/500000] + train/ActionNoiseL2Loss=0.0232 + throughput/total_tokens=2,015,424,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10498/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,015,616,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10499/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=2,015,808,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10500/500000] + optim/total_grad_norm=1.243 + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,016,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +10/08 [06:55:23] INFO | >> Saving config... checkpoint.py:608 +10/08 [06:56:10] INFO | >> Saving model state... checkpoint.py:796 +10/08 [06:57:25] INFO | >> Saving optim state... checkpoint.py:811 +10/08 [06:58:58] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=10501/500000] + train/ActionNoiseL2Loss=0.0229 + throughput/total_tokens=2,016,192,000 + throughput/device/tokens_per_second=1,192 + throughput/device/batches_per_second=0.0497 +[step=10502/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=2,016,384,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10503/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=2,016,576,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=10504/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=2,016,768,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=10505/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=2,016,960,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10506/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,017,152,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=10507/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=2,017,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10508/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=2,017,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10509/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=2,017,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10510/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=2,017,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10511/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=2,018,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10512/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,018,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10513/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=2,018,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10514/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,018,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10515/500000] + train/ActionNoiseL2Loss=0.0204 + throughput/total_tokens=2,018,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10516/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=2,019,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10517/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=2,019,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10518/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=2,019,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10519/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=2,019,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10520/500000] + optim/total_grad_norm=1.048 + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,019,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10521/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=2,020,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10522/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=2,020,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10523/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=2,020,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10524/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=2,020,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10525/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=2,020,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10526/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=2,020,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10527/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=2,021,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10528/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=2,021,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10529/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=2,021,568,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10530/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=2,021,760,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10531/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=2,021,952,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10532/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=2,022,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10533/500000] + train/ActionNoiseL2Loss=0.0207 + throughput/total_tokens=2,022,336,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10534/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=2,022,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10535/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=2,022,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10536/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=2,022,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10537/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,023,104,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10538/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,023,296,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10539/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=2,023,488,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10540/500000] + optim/total_grad_norm=1.505 + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=2,023,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10541/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=2,023,872,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10542/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,024,064,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10543/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=2,024,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10544/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=2,024,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10545/500000] + train/ActionNoiseL2Loss=0.0207 + throughput/total_tokens=2,024,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10546/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,024,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10547/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=2,025,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10548/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=2,025,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10549/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=2,025,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10550/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=2,025,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10551/500000] + train/ActionNoiseL2Loss=0.0202 + throughput/total_tokens=2,025,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10552/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=2,025,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10553/500000] + train/ActionNoiseL2Loss=0.0222 + throughput/total_tokens=2,026,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10554/500000] + train/ActionNoiseL2Loss=0.0260 + throughput/total_tokens=2,026,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10555/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=2,026,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10556/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=2,026,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10557/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=2,026,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10558/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=2,027,136,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10559/500000] + train/ActionNoiseL2Loss=0.0245 + throughput/total_tokens=2,027,328,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10560/500000] + optim/total_grad_norm=1.240 + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=2,027,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10561/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=2,027,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10562/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=2,027,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10563/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,028,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10564/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=2,028,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10565/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=2,028,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10566/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=2,028,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10567/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=2,028,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10568/500000] + train/ActionNoiseL2Loss=0.0246 + throughput/total_tokens=2,029,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10569/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=2,029,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10570/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=2,029,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10571/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,029,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10572/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=2,029,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10573/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=2,030,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10574/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=2,030,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10575/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=2,030,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10576/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=2,030,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10577/500000] + train/ActionNoiseL2Loss=0.1581 + throughput/total_tokens=2,030,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10578/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=2,030,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10579/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=2,031,168,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10580/500000] + optim/total_grad_norm=1.367 + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=2,031,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10581/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=2,031,552,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10582/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=2,031,744,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10583/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=2,031,936,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10584/500000] + train/ActionNoiseL2Loss=0.0252 + throughput/total_tokens=2,032,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10585/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=2,032,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10586/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,032,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10587/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=2,032,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10588/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,032,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10589/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=2,033,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10590/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,033,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10591/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,033,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10592/500000] + train/ActionNoiseL2Loss=0.0250 + throughput/total_tokens=2,033,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10593/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=2,033,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10594/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=2,034,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10595/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=2,034,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10596/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=2,034,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10597/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=2,034,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10598/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=2,034,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10599/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=2,035,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10600/500000] + optim/total_grad_norm=0.9163 + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=2,035,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10601/500000] + train/ActionNoiseL2Loss=0.1468 + throughput/total_tokens=2,035,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10602/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=2,035,584,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10603/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=2,035,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10604/500000] + train/ActionNoiseL2Loss=0.0288 + throughput/total_tokens=2,035,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10605/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=2,036,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10606/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=2,036,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10607/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=2,036,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10608/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=2,036,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10609/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,036,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10610/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=2,037,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10611/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=2,037,312,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10612/500000] + train/ActionNoiseL2Loss=0.0227 + throughput/total_tokens=2,037,504,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10613/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=2,037,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10614/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=2,037,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10615/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,038,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10616/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,038,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10617/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,038,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10618/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,038,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10619/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=2,038,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10620/500000] + optim/total_grad_norm=0.7004 + train/ActionNoiseL2Loss=0.0103 + throughput/total_tokens=2,039,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10621/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,039,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10622/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=2,039,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10623/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=2,039,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10624/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=2,039,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10625/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,040,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10626/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=2,040,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10627/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=2,040,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10628/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=2,040,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10629/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,040,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10630/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,040,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10631/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,041,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10632/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=2,041,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10633/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,041,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10634/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=2,041,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10635/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=2,041,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10636/500000] + train/ActionNoiseL2Loss=0.0145 + throughput/total_tokens=2,042,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10637/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=2,042,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10638/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,042,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10639/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=2,042,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10640/500000] + optim/total_grad_norm=1.354 + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=2,042,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10641/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=2,043,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10642/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=2,043,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10643/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=2,043,456,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10644/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=2,043,648,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10645/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=2,043,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10646/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=2,044,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10647/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=2,044,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10648/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=2,044,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10649/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=2,044,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10650/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,044,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10651/500000] + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=2,044,992,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10652/500000] + train/ActionNoiseL2Loss=0.0270 + throughput/total_tokens=2,045,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10653/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,045,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10654/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=2,045,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10655/500000] + train/ActionNoiseL2Loss=0.0262 + throughput/total_tokens=2,045,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10656/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=2,045,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10657/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=2,046,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10658/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=2,046,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10659/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=2,046,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10660/500000] + optim/total_grad_norm=0.6877 + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=2,046,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10661/500000] + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=2,046,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10662/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=2,047,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10663/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=2,047,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10664/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=2,047,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10665/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,047,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10666/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=2,047,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10667/500000] + train/ActionNoiseL2Loss=0.0288 + throughput/total_tokens=2,048,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10668/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=2,048,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10669/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=2,048,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10670/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=2,048,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10671/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=2,048,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10672/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=2,049,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10673/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,049,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10674/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,049,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10675/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=2,049,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10676/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=2,049,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10677/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,049,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10678/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=2,050,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10679/500000] + train/ActionNoiseL2Loss=0.0274 + throughput/total_tokens=2,050,368,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10680/500000] + optim/total_grad_norm=1.235 + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=2,050,560,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10681/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=2,050,752,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10682/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=2,050,944,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10683/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=2,051,136,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10684/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=2,051,328,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10685/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,051,520,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10686/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=2,051,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10687/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,051,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10688/500000] + train/ActionNoiseL2Loss=0.0258 + throughput/total_tokens=2,052,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10689/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=2,052,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10690/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,052,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10691/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=2,052,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10692/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=2,052,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10693/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=2,053,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10694/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=2,053,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10695/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=2,053,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10696/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,053,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10697/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=2,053,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10698/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=2,054,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10699/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,054,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10700/500000] + optim/total_grad_norm=1.178 + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=2,054,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10701/500000] + train/ActionNoiseL2Loss=0.0300 + throughput/total_tokens=2,054,592,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10702/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=2,054,784,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10703/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=2,054,976,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10704/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=2,055,168,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10705/500000] + train/ActionNoiseL2Loss=0.0929 + throughput/total_tokens=2,055,360,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10706/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,055,552,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10707/500000] + train/ActionNoiseL2Loss=0.0225 + throughput/total_tokens=2,055,744,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10708/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=2,055,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10709/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=2,056,128,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10710/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,056,320,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10711/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=2,056,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10712/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=2,056,704,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10713/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=2,056,896,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10714/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=2,057,088,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10715/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=2,057,280,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10716/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=2,057,472,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10717/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=2,057,664,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10718/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=2,057,856,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10719/500000] + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=2,058,048,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10720/500000] + optim/total_grad_norm=1.007 + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,058,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10721/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=2,058,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10722/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=2,058,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10723/500000] + train/ActionNoiseL2Loss=0.1058 + throughput/total_tokens=2,058,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10724/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=2,059,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10725/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=2,059,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10726/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=2,059,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10727/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=2,059,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10728/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=2,059,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10729/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,059,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10730/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=2,060,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10731/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=2,060,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10732/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=2,060,544,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10733/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=2,060,736,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10734/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=2,060,928,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10735/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=2,061,120,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10736/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=2,061,312,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10737/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=2,061,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10738/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,061,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10739/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=2,061,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10740/500000] + optim/total_grad_norm=1.191 + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=2,062,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10741/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=2,062,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10742/500000] + train/ActionNoiseL2Loss=0.1101 + throughput/total_tokens=2,062,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10743/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=2,062,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10744/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=2,062,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10745/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=2,063,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10746/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,063,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10747/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=2,063,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10748/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,063,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10749/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,063,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10750/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,064,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10751/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=2,064,192,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10752/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,064,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10753/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,064,576,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10754/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=2,064,768,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10755/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=2,064,960,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10756/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=2,065,152,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10757/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=2,065,344,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10758/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,065,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10759/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=2,065,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10760/500000] + optim/total_grad_norm=1.466 + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=2,065,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10761/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=2,066,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10762/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=2,066,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10763/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=2,066,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10764/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=2,066,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10765/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=2,066,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10766/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=2,067,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10767/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=2,067,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10768/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=2,067,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10769/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=2,067,648,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10770/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=2,067,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10771/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=2,068,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10772/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=2,068,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10773/500000] + train/ActionNoiseL2Loss=0.0261 + throughput/total_tokens=2,068,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10774/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=2,068,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10775/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=2,068,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10776/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,068,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10777/500000] + train/ActionNoiseL2Loss=0.0236 + throughput/total_tokens=2,069,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10778/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=2,069,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10779/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=2,069,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10780/500000] + optim/total_grad_norm=1.155 + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=2,069,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10781/500000] + train/ActionNoiseL2Loss=0.0229 + throughput/total_tokens=2,069,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10782/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=2,070,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10783/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=2,070,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10784/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=2,070,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10785/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=2,070,720,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10786/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=2,070,912,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10787/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,071,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10788/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=2,071,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10789/500000] + train/ActionNoiseL2Loss=0.0286 + throughput/total_tokens=2,071,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10790/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,071,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10791/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=2,071,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10792/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=2,072,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10793/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=2,072,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10794/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=2,072,448,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10795/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=2,072,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10796/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=2,072,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10797/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=2,073,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10798/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=2,073,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10799/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=2,073,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10800/500000] + optim/total_grad_norm=1.209 + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,073,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10801/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,073,792,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10802/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=2,073,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10803/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,074,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10804/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=2,074,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10805/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=2,074,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10806/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=2,074,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10807/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=2,074,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10808/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,075,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10809/500000] + train/ActionNoiseL2Loss=0.0217 + throughput/total_tokens=2,075,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10810/500000] + train/ActionNoiseL2Loss=0.0266 + throughput/total_tokens=2,075,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10811/500000] + train/ActionNoiseL2Loss=0.0160 + throughput/total_tokens=2,075,712,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10812/500000] + train/ActionNoiseL2Loss=0.0278 + throughput/total_tokens=2,075,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10813/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=2,076,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10814/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=2,076,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10815/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=2,076,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10816/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,076,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10817/500000] + train/ActionNoiseL2Loss=0.0275 + throughput/total_tokens=2,076,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10818/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=2,077,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10819/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=2,077,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10820/500000] + optim/total_grad_norm=1.465 + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=2,077,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10821/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=2,077,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10822/500000] + train/ActionNoiseL2Loss=0.0211 + throughput/total_tokens=2,077,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10823/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=2,078,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10824/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=2,078,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10825/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=2,078,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10826/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,078,592,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10827/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=2,078,784,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10828/500000] + train/ActionNoiseL2Loss=0.0254 + throughput/total_tokens=2,078,976,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10829/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=2,079,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10830/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,079,360,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10831/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=2,079,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10832/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,079,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10833/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=2,079,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10834/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,080,128,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10835/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=2,080,320,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10836/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=2,080,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10837/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=2,080,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10838/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=2,080,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10839/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=2,081,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10840/500000] + optim/total_grad_norm=1.172 + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=2,081,280,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10841/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=2,081,472,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10842/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,081,664,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10843/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=2,081,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10844/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=2,082,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10845/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=2,082,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10846/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=2,082,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10847/500000] + train/ActionNoiseL2Loss=0.0169 + throughput/total_tokens=2,082,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10848/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=2,082,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10849/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=2,083,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10850/500000] + train/ActionNoiseL2Loss=0.0224 + throughput/total_tokens=2,083,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10851/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=2,083,392,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10852/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=2,083,584,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10853/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,083,776,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10854/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=2,083,968,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10855/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=2,084,160,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10856/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=2,084,352,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10857/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=2,084,544,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10858/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=2,084,736,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10859/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,084,928,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10860/500000] + optim/total_grad_norm=1.081 + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=2,085,120,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=10861/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=2,085,312,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10862/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=2,085,504,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10863/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=2,085,696,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10864/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=2,085,888,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10865/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,086,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10866/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,086,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10867/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=2,086,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10868/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,086,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10869/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=2,086,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10870/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=2,087,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10871/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,087,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10872/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=2,087,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10873/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=2,087,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10874/500000] + train/ActionNoiseL2Loss=0.0249 + throughput/total_tokens=2,087,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10875/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,088,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10876/500000] + train/ActionNoiseL2Loss=0.0242 + throughput/total_tokens=2,088,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10877/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=2,088,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10878/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=2,088,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10879/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=2,088,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10880/500000] + optim/total_grad_norm=1.378 + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=2,088,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10881/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=2,089,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10882/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=2,089,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10883/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,089,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10884/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=2,089,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10885/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=2,089,920,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10886/500000] + train/ActionNoiseL2Loss=0.0155 + throughput/total_tokens=2,090,112,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10887/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=2,090,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10888/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=2,090,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10889/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=2,090,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10890/500000] + train/ActionNoiseL2Loss=0.0140 + throughput/total_tokens=2,090,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10891/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=2,091,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10892/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=2,091,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10893/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=2,091,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10894/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=2,091,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10895/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,091,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10896/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=2,092,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10897/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=2,092,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10898/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,092,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10899/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=2,092,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10900/500000] + optim/total_grad_norm=1.139 + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=2,092,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10901/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=2,092,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10902/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=2,093,184,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10903/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=2,093,376,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10904/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=2,093,568,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10905/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=2,093,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10906/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,093,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10907/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=2,094,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10908/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,094,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10909/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,094,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10910/500000] + train/ActionNoiseL2Loss=0.0192 + throughput/total_tokens=2,094,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10911/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=2,094,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10912/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=2,095,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10913/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=2,095,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10914/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=2,095,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10915/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=2,095,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10916/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=2,095,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10917/500000] + train/ActionNoiseL2Loss=0.0196 + throughput/total_tokens=2,096,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10918/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=2,096,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10919/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=2,096,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10920/500000] + optim/total_grad_norm=1.211 + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=2,096,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10921/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=2,096,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10922/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,097,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10923/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,097,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10924/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=2,097,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10925/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=2,097,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10926/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,097,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10927/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=2,097,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10928/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=2,098,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10929/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=2,098,368,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10930/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=2,098,560,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10931/500000] + train/ActionNoiseL2Loss=0.0210 + throughput/total_tokens=2,098,752,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10932/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,098,944,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10933/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=2,099,136,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10934/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=2,099,328,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10935/500000] + train/ActionNoiseL2Loss=0.0229 + throughput/total_tokens=2,099,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10936/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,099,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10937/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,099,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10938/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=2,100,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10939/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=2,100,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10940/500000] + optim/total_grad_norm=1.293 + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=2,100,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10941/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=2,100,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10942/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=2,100,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10943/500000] + train/ActionNoiseL2Loss=0.1299 + throughput/total_tokens=2,101,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10944/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=2,101,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10945/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,101,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10946/500000] + train/ActionNoiseL2Loss=0.0188 + throughput/total_tokens=2,101,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10947/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=2,101,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10948/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=2,102,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=10949/500000] + train/ActionNoiseL2Loss=0.0149 + throughput/total_tokens=2,102,208,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=10950/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=2,102,400,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10951/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=2,102,592,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10952/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=2,102,784,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10953/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=2,102,976,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=10954/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=2,103,168,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10955/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=2,103,360,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10956/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=2,103,552,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=10957/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=2,103,744,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10958/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=2,103,936,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10959/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,104,128,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10960/500000] + optim/total_grad_norm=1.914 + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=2,104,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=10961/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=2,104,512,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=10962/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,104,704,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10963/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=2,104,896,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10964/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,105,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10965/500000] + train/ActionNoiseL2Loss=0.0295 + throughput/total_tokens=2,105,280,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10966/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=2,105,472,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10967/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=2,105,664,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10968/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=2,105,856,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10969/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=2,106,048,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=10970/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,106,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10971/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=2,106,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10972/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=2,106,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10973/500000] + train/ActionNoiseL2Loss=0.0258 + throughput/total_tokens=2,106,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10974/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=2,107,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10975/500000] + train/ActionNoiseL2Loss=0.0233 + throughput/total_tokens=2,107,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10976/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=2,107,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10977/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=2,107,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10978/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=2,107,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10979/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=2,107,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10980/500000] + optim/total_grad_norm=0.7127 + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,108,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=10981/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=2,108,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10982/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=2,108,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10983/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=2,108,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10984/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=2,108,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10985/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=2,109,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10986/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,109,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10987/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=2,109,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10988/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=2,109,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10989/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=2,109,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=10990/500000] + train/ActionNoiseL2Loss=0.0187 + throughput/total_tokens=2,110,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=10991/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=2,110,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10992/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=2,110,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=10993/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=2,110,656,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10994/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=2,110,848,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10995/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=2,111,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10996/500000] + train/ActionNoiseL2Loss=0.0265 + throughput/total_tokens=2,111,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10997/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,111,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10998/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=2,111,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=10999/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=2,111,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11000/500000] + optim/total_grad_norm=1.362 + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=2,112,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/08 [09:53:28] INFO | >> Saving config... checkpoint.py:608 +10/08 [09:54:02] INFO | >> Saving model state... checkpoint.py:796 +10/08 [09:55:19] INFO | >> Saving optim state... checkpoint.py:811 +10/08 [09:56:51] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=11001/500000] + train/ActionNoiseL2Loss=0.1505 + throughput/total_tokens=2,112,192,000 + throughput/device/tokens_per_second=1,187 + throughput/device/batches_per_second=0.0495 +[step=11002/500000] + train/ActionNoiseL2Loss=0.0246 + throughput/total_tokens=2,112,384,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11003/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=2,112,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11004/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=2,112,768,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11005/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=2,112,960,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=11006/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=2,113,152,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11007/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=2,113,344,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11008/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=2,113,536,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11009/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=2,113,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11010/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,113,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11011/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=2,114,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11012/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=2,114,304,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11013/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=2,114,496,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11014/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=2,114,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11015/500000] + train/ActionNoiseL2Loss=0.1227 + throughput/total_tokens=2,114,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11016/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=2,115,072,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11017/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=2,115,264,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11018/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,115,456,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11019/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,115,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11020/500000] + optim/total_grad_norm=1.188 + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=2,115,840,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11021/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=2,116,032,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11022/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=2,116,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11023/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=2,116,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11024/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=2,116,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11025/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=2,116,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11026/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=2,116,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11027/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=2,117,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11028/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=2,117,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11029/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=2,117,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11030/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=2,117,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11031/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=2,117,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11032/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=2,118,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11033/500000] + train/ActionNoiseL2Loss=0.0187 + throughput/total_tokens=2,118,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11034/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=2,118,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11035/500000] + train/ActionNoiseL2Loss=0.0231 + throughput/total_tokens=2,118,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11036/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=2,118,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11037/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=2,119,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11038/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=2,119,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11039/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,119,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11040/500000] + optim/total_grad_norm=0.8962 + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=2,119,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11041/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,119,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11042/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=2,120,064,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11043/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=2,120,256,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11044/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,120,448,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11045/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=2,120,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11046/500000] + train/ActionNoiseL2Loss=0.0244 + throughput/total_tokens=2,120,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11047/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=2,121,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11048/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,121,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11049/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=2,121,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11050/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=2,121,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11051/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=2,121,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11052/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=2,121,984,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11053/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=2,122,176,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11054/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=2,122,368,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11055/500000] + train/ActionNoiseL2Loss=0.1186 + throughput/total_tokens=2,122,560,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11056/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=2,122,752,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11057/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=2,122,944,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11058/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=2,123,136,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11059/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=2,123,328,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11060/500000] + optim/total_grad_norm=0.8510 + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,123,520,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11061/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,123,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11062/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,123,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11063/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=2,124,096,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11064/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=2,124,288,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11065/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=2,124,480,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11066/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=2,124,672,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11067/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=2,124,864,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11068/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,125,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11069/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=2,125,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11070/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=2,125,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11071/500000] + train/ActionNoiseL2Loss=0.0279 + throughput/total_tokens=2,125,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11072/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=2,125,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11073/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=2,126,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11074/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=2,126,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11075/500000] + train/ActionNoiseL2Loss=0.0182 + throughput/total_tokens=2,126,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11076/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,126,592,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11077/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=2,126,784,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11078/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=2,126,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11079/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,127,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11080/500000] + optim/total_grad_norm=1.278 + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=2,127,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11081/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,127,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11082/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=2,127,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11083/500000] + train/ActionNoiseL2Loss=0.0204 + throughput/total_tokens=2,127,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11084/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=2,128,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11085/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=2,128,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11086/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=2,128,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11087/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,128,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11088/500000] + train/ActionNoiseL2Loss=0.0246 + throughput/total_tokens=2,128,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11089/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=2,129,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11090/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,129,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11091/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=2,129,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11092/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,129,664,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11093/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,129,856,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11094/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,130,048,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11095/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=2,130,240,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11096/500000] + train/ActionNoiseL2Loss=0.0288 + throughput/total_tokens=2,130,432,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11097/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=2,130,624,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11098/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=2,130,816,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11099/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=2,131,008,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11100/500000] + optim/total_grad_norm=0.7170 + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=2,131,200,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11101/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=2,131,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11102/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=2,131,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11103/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,131,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11104/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=2,131,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11105/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=2,132,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11106/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=2,132,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11107/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=2,132,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11108/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=2,132,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11109/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=2,132,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11110/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=2,133,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=11111/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=2,133,312,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11112/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=2,133,504,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11113/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=2,133,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11114/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=2,133,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11115/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=2,134,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11116/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=2,134,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11117/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=2,134,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11118/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=2,134,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11119/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=2,134,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11120/500000] + optim/total_grad_norm=1.403 + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=2,135,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11121/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=2,135,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11122/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,135,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11123/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,135,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11124/500000] + train/ActionNoiseL2Loss=0.0184 + throughput/total_tokens=2,135,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11125/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=2,136,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11126/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=2,136,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11127/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,136,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11128/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=2,136,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11129/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=2,136,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11130/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=2,136,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11131/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=2,137,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11132/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,137,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11133/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,137,536,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11134/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=2,137,728,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11135/500000] + train/ActionNoiseL2Loss=0.0208 + throughput/total_tokens=2,137,920,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11136/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=2,138,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11137/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,138,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11138/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,138,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11139/500000] + train/ActionNoiseL2Loss=0.0097 + throughput/total_tokens=2,138,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11140/500000] + optim/total_grad_norm=1.546 + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=2,138,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11141/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=2,139,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11142/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=2,139,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11143/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=2,139,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11144/500000] + train/ActionNoiseL2Loss=0.0221 + throughput/total_tokens=2,139,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11145/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=2,139,840,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11146/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,140,032,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11147/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=2,140,224,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11148/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,140,416,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11149/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=2,140,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11150/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=2,140,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11151/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,140,992,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11152/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=2,141,184,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11153/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,141,376,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11154/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=2,141,568,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11155/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=2,141,760,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11156/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,141,952,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11157/500000] + train/ActionNoiseL2Loss=0.0270 + throughput/total_tokens=2,142,144,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11158/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=2,142,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11159/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=2,142,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11160/500000] + optim/total_grad_norm=0.6758 + train/ActionNoiseL2Loss=0.0178 + throughput/total_tokens=2,142,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11161/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=2,142,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11162/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,143,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11163/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=2,143,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11164/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=2,143,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11165/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=2,143,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11166/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=2,143,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11167/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=2,144,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11168/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=2,144,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11169/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=2,144,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11170/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,144,640,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11171/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=2,144,832,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11172/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=2,145,024,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11173/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=2,145,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11174/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=2,145,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11175/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=2,145,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11176/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=2,145,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11177/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,145,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11178/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=2,146,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11179/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=2,146,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11180/500000] + optim/total_grad_norm=1.332 + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=2,146,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11181/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=2,146,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11182/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=2,146,944,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11183/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=2,147,136,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11184/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=2,147,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11185/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,147,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11186/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=2,147,712,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11187/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=2,147,904,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11188/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=2,148,096,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11189/500000] + train/ActionNoiseL2Loss=0.0278 + throughput/total_tokens=2,148,288,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11190/500000] + train/ActionNoiseL2Loss=0.0292 + throughput/total_tokens=2,148,480,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11191/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=2,148,672,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11192/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=2,148,864,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11193/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=2,149,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11194/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=2,149,248,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11195/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,149,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11196/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,149,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11197/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=2,149,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11198/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=2,150,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11199/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=2,150,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11200/500000] + optim/total_grad_norm=0.9374 + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,150,400,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11201/500000] + train/ActionNoiseL2Loss=0.0255 + throughput/total_tokens=2,150,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11202/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=2,150,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11203/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=2,150,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11204/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=2,151,168,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11205/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=2,151,360,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11206/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=2,151,552,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11207/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=2,151,744,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11208/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,151,936,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11209/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,152,128,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11210/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=2,152,320,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11211/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=2,152,512,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11212/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,152,704,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11213/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=2,152,896,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11214/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,153,088,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11215/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=2,153,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11216/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=2,153,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11217/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=2,153,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11218/500000] + train/ActionNoiseL2Loss=0.1201 + throughput/total_tokens=2,153,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11219/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=2,154,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11220/500000] + optim/total_grad_norm=1.058 + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=2,154,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11221/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=2,154,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11222/500000] + train/ActionNoiseL2Loss=0.0255 + throughput/total_tokens=2,154,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11223/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=2,154,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11224/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,155,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11225/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=2,155,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11226/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=2,155,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11227/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=2,155,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11228/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=2,155,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11229/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=2,155,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11230/500000] + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=2,156,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11231/500000] + train/ActionNoiseL2Loss=0.0112 + throughput/total_tokens=2,156,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11232/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,156,544,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11233/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=2,156,736,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11234/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=2,156,928,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11235/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=2,157,120,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11236/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=2,157,312,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11237/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=2,157,504,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11238/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=2,157,696,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11239/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=2,157,888,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11240/500000] + optim/total_grad_norm=0.8558 + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,158,080,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11241/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=2,158,272,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11242/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,158,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11243/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=2,158,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11244/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=2,158,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11245/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=2,159,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11246/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=2,159,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11247/500000] + train/ActionNoiseL2Loss=0.0278 + throughput/total_tokens=2,159,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11248/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=2,159,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11249/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,159,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11250/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=2,160,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11251/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=2,160,192,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11252/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=2,160,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11253/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=2,160,576,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11254/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=2,160,768,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11255/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=2,160,960,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11256/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=2,161,152,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11257/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=2,161,344,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11258/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=2,161,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11259/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=2,161,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11260/500000] + optim/total_grad_norm=1.136 + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=2,161,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11261/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=2,162,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11262/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=2,162,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11263/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=2,162,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11264/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,162,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11265/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=2,162,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11266/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=2,163,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11267/500000] + train/ActionNoiseL2Loss=0.0249 + throughput/total_tokens=2,163,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11268/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=2,163,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11269/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=2,163,648,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11270/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,163,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11271/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=2,164,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11272/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=2,164,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11273/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=2,164,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11274/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=2,164,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11275/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=2,164,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11276/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=2,164,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11277/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,165,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11278/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=2,165,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11279/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=2,165,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11280/500000] + optim/total_grad_norm=0.9114 + train/ActionNoiseL2Loss=0.0220 + throughput/total_tokens=2,165,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11281/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=2,165,952,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11282/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=2,166,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11283/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=2,166,336,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11284/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=2,166,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11285/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=2,166,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11286/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=2,166,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11287/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,167,104,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11288/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,167,296,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11289/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=2,167,488,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11290/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,167,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11291/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=2,167,872,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11292/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,168,064,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11293/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,168,256,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11294/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,168,448,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11295/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=2,168,640,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11296/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=2,168,832,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11297/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=2,169,024,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11298/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=2,169,216,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11299/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=2,169,408,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11300/500000] + optim/total_grad_norm=0.8113 + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=2,169,600,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11301/500000] + train/ActionNoiseL2Loss=0.0229 + throughput/total_tokens=2,169,792,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11302/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=2,169,984,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11303/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=2,170,176,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11304/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,170,368,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11305/500000] + train/ActionNoiseL2Loss=0.0248 + throughput/total_tokens=2,170,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11306/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,170,752,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11307/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=2,170,944,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11308/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=2,171,136,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11309/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=2,171,328,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11310/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=2,171,520,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=11311/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,171,712,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11312/500000] + train/ActionNoiseL2Loss=0.0168 + throughput/total_tokens=2,171,904,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11313/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=2,172,096,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11314/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=2,172,288,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11315/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=2,172,480,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11316/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=2,172,672,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11317/500000] + train/ActionNoiseL2Loss=0.0199 + throughput/total_tokens=2,172,864,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11318/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=2,173,056,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11319/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=2,173,248,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11320/500000] + optim/total_grad_norm=1.616 + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=2,173,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11321/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=2,173,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11322/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=2,173,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11323/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=2,174,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11324/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,174,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11325/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=2,174,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11326/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,174,592,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11327/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,174,784,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11328/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=2,174,976,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11329/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,175,168,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11330/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=2,175,360,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11331/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=2,175,552,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11332/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,175,744,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11333/500000] + train/ActionNoiseL2Loss=0.0192 + throughput/total_tokens=2,175,936,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11334/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=2,176,128,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11335/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=2,176,320,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11336/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=2,176,512,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11337/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=2,176,704,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11338/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=2,176,896,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11339/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=2,177,088,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11340/500000] + optim/total_grad_norm=1.343 + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,177,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11341/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=2,177,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11342/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=2,177,664,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11343/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=2,177,856,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11344/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=2,178,048,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11345/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,178,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11346/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=2,178,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11347/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,178,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11348/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=2,178,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11349/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=2,179,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11350/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=2,179,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11351/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,179,392,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11352/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=2,179,584,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11353/500000] + train/ActionNoiseL2Loss=0.0209 + throughput/total_tokens=2,179,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11354/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=2,179,968,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11355/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,180,160,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11356/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=2,180,352,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11357/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,180,544,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11358/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=2,180,736,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11359/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=2,180,928,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11360/500000] + optim/total_grad_norm=0.9663 + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=2,181,120,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 + System/Peak GPU Memory (MB)=46,467 +[step=11361/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=2,181,312,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11362/500000] + train/ActionNoiseL2Loss=0.0247 + throughput/total_tokens=2,181,504,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11363/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=2,181,696,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11364/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,181,888,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11365/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=2,182,080,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11366/500000] + train/ActionNoiseL2Loss=0.0147 + throughput/total_tokens=2,182,272,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11367/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=2,182,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11368/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=2,182,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11369/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=2,182,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11370/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=2,183,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11371/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=2,183,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11372/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,183,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11373/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=2,183,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11374/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=2,183,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11375/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=2,184,000,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11376/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=2,184,192,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11377/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=2,184,384,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11378/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=2,184,576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11379/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=2,184,768,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11380/500000] + optim/total_grad_norm=0.9405 + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=2,184,960,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11381/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=2,185,152,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11382/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,185,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11383/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=2,185,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11384/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,185,728,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11385/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=2,185,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11386/500000] + train/ActionNoiseL2Loss=0.0185 + throughput/total_tokens=2,186,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11387/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,186,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11388/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=2,186,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11389/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,186,688,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11390/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=2,186,880,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11391/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=2,187,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11392/500000] + train/ActionNoiseL2Loss=0.0156 + throughput/total_tokens=2,187,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11393/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,187,456,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11394/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=2,187,648,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11395/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=2,187,840,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11396/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=2,188,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11397/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=2,188,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11398/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=2,188,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11399/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,188,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11400/500000] + optim/total_grad_norm=0.8828 + train/ActionNoiseL2Loss=0.0262 + throughput/total_tokens=2,188,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11401/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=2,188,992,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11402/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=2,189,184,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11403/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=2,189,376,000 + throughput/device/tokens_per_second=1,154 + throughput/device/batches_per_second=0.0481 +[step=11404/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=2,189,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11405/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,189,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11406/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,189,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11407/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,190,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11408/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,190,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11409/500000] + train/ActionNoiseL2Loss=0.0187 + throughput/total_tokens=2,190,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11410/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=2,190,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11411/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=2,190,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11412/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=2,191,104,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11413/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=2,191,296,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11414/500000] + train/ActionNoiseL2Loss=0.0262 + throughput/total_tokens=2,191,488,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11415/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=2,191,680,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11416/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=2,191,872,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11417/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=2,192,064,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11418/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,192,256,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11419/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=2,192,448,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11420/500000] + optim/total_grad_norm=1.353 + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=2,192,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11421/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=2,192,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11422/500000] + train/ActionNoiseL2Loss=0.0261 + throughput/total_tokens=2,193,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11423/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,193,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11424/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=2,193,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11425/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=2,193,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11426/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,193,792,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11427/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=2,193,984,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11428/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=2,194,176,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11429/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=2,194,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11430/500000] + train/ActionNoiseL2Loss=0.0243 + throughput/total_tokens=2,194,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11431/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,194,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11432/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=2,194,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11433/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=2,195,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11434/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=2,195,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11435/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=2,195,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11436/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=2,195,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11437/500000] + train/ActionNoiseL2Loss=0.0265 + throughput/total_tokens=2,195,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11438/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=2,196,096,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11439/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=2,196,288,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11440/500000] + optim/total_grad_norm=0.7206 + train/ActionNoiseL2Loss=0.0225 + throughput/total_tokens=2,196,480,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11441/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=2,196,672,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11442/500000] + train/ActionNoiseL2Loss=0.0298 + throughput/total_tokens=2,196,864,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11443/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=2,197,056,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11444/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,197,248,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11445/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=2,197,440,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11446/500000] + train/ActionNoiseL2Loss=0.0248 + throughput/total_tokens=2,197,632,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11447/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=2,197,824,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11448/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=2,198,016,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11449/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=2,198,208,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11450/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=2,198,400,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11451/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,198,592,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11452/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=2,198,784,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11453/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,198,976,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11454/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=2,199,168,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11455/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,199,360,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11456/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=2,199,552,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11457/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,199,744,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11458/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=2,199,936,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11459/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=2,200,128,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11460/500000] + optim/total_grad_norm=1.130 + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=2,200,320,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11461/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,200,512,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11462/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=2,200,704,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11463/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=2,200,896,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11464/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=2,201,088,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11465/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=2,201,280,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11466/500000] + train/ActionNoiseL2Loss=0.0917 + throughput/total_tokens=2,201,472,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11467/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=2,201,664,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11468/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=2,201,856,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11469/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=2,202,048,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11470/500000] + train/ActionNoiseL2Loss=0.0207 + throughput/total_tokens=2,202,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11471/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=2,202,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11472/500000] + train/ActionNoiseL2Loss=0.0232 + throughput/total_tokens=2,202,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11473/500000] + train/ActionNoiseL2Loss=0.0180 + throughput/total_tokens=2,202,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11474/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=2,203,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11475/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,203,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11476/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=2,203,392,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11477/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,203,584,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11478/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,203,776,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11479/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=2,203,968,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11480/500000] + optim/total_grad_norm=1.136 + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=2,204,160,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11481/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,204,352,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11482/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=2,204,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11483/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,204,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11484/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=2,204,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11485/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,205,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11486/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=2,205,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11487/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=2,205,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11488/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=2,205,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11489/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=2,205,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11490/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=2,206,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11491/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=2,206,272,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11492/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=2,206,464,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11493/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,206,656,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11494/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=2,206,848,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11495/500000] + train/ActionNoiseL2Loss=0.0243 + throughput/total_tokens=2,207,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11496/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=2,207,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11497/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=2,207,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11498/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=2,207,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11499/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,207,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11500/500000] + optim/total_grad_norm=0.7655 + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=2,208,000,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +10/08 [12:51:20] INFO | >> Saving config... checkpoint.py:608 +10/08 [12:51:52] INFO | >> Saving model state... checkpoint.py:796 +10/08 [12:53:06] INFO | >> Saving optim state... checkpoint.py:811 +10/08 [12:54:42] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=11501/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=2,208,192,000 + throughput/device/tokens_per_second=1,193 + throughput/device/batches_per_second=0.0497 +[step=11502/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=2,208,384,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=11503/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,208,576,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=11504/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=2,208,768,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11505/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=2,208,960,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11506/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=2,209,152,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11507/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=2,209,344,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11508/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=2,209,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11509/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=2,209,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11510/500000] + train/ActionNoiseL2Loss=0.0216 + throughput/total_tokens=2,209,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11511/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=2,210,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11512/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,210,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11513/500000] + train/ActionNoiseL2Loss=0.0186 + throughput/total_tokens=2,210,496,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11514/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=2,210,688,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11515/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=2,210,880,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11516/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=2,211,072,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11517/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=2,211,264,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11518/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=2,211,456,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11519/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=2,211,648,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11520/500000] + optim/total_grad_norm=0.9331 + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=2,211,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11521/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=2,212,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11522/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=2,212,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11523/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=2,212,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11524/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=2,212,608,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11525/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=2,212,800,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11526/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=2,212,992,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11527/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,213,184,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11528/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=2,213,376,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11529/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=2,213,568,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11530/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=2,213,760,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11531/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,213,952,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11532/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,214,144,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11533/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=2,214,336,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11534/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=2,214,528,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11535/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=2,214,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11536/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=2,214,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11537/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=2,215,104,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11538/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=2,215,296,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11539/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,215,488,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11540/500000] + optim/total_grad_norm=1.014 + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=2,215,680,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11541/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,215,872,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11542/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=2,216,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11543/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=2,216,256,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11544/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=2,216,448,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11545/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,216,640,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11546/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=2,216,832,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11547/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,217,024,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11548/500000] + train/ActionNoiseL2Loss=0.0240 + throughput/total_tokens=2,217,216,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11549/500000] + train/ActionNoiseL2Loss=0.0232 + throughput/total_tokens=2,217,408,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11550/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=2,217,600,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11551/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=2,217,792,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11552/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=2,217,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11553/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,218,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11554/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=2,218,368,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11555/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,218,560,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11556/500000] + train/ActionNoiseL2Loss=0.0215 + throughput/total_tokens=2,218,752,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11557/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=2,218,944,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11558/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=2,219,136,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11559/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=2,219,328,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11560/500000] + optim/total_grad_norm=1.119 + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=2,219,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11561/500000] + train/ActionNoiseL2Loss=0.0183 + throughput/total_tokens=2,219,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11562/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=2,219,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11563/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=2,220,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11564/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=2,220,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11565/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=2,220,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11566/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=2,220,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11567/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=2,220,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11568/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,221,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11569/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=2,221,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11570/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,221,440,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11571/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=2,221,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11572/500000] + train/ActionNoiseL2Loss=0.1085 + throughput/total_tokens=2,221,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11573/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=2,222,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11574/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=2,222,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11575/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=2,222,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11576/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=2,222,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11577/500000] + train/ActionNoiseL2Loss=0.0270 + throughput/total_tokens=2,222,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11578/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=2,222,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11579/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=2,223,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11580/500000] + optim/total_grad_norm=1.222 + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,223,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11581/500000] + train/ActionNoiseL2Loss=0.0201 + throughput/total_tokens=2,223,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11582/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=2,223,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11583/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=2,223,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11584/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=2,224,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11585/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=2,224,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11586/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,224,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11587/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=2,224,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11588/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=2,224,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11589/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=2,225,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11590/500000] + train/ActionNoiseL2Loss=0.1100 + throughput/total_tokens=2,225,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11591/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=2,225,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11592/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=2,225,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11593/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=2,225,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11594/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,226,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11595/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=2,226,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11596/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=2,226,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11597/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=2,226,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11598/500000] + train/ActionNoiseL2Loss=0.1159 + throughput/total_tokens=2,226,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11599/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=2,227,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11600/500000] + optim/total_grad_norm=1.246 + train/ActionNoiseL2Loss=0.0239 + throughput/total_tokens=2,227,200,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11601/500000] + train/ActionNoiseL2Loss=0.0237 + throughput/total_tokens=2,227,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11602/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=2,227,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11603/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=2,227,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11604/500000] + train/ActionNoiseL2Loss=0.1085 + throughput/total_tokens=2,227,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11605/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=2,228,160,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11606/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=2,228,352,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11607/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=2,228,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11608/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=2,228,736,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11609/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=2,228,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11610/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=2,229,120,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11611/500000] + train/ActionNoiseL2Loss=0.0201 + throughput/total_tokens=2,229,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11612/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,229,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11613/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=2,229,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11614/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=2,229,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11615/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=2,230,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11616/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=2,230,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11617/500000] + train/ActionNoiseL2Loss=0.1128 + throughput/total_tokens=2,230,464,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11618/500000] + train/ActionNoiseL2Loss=0.0195 + throughput/total_tokens=2,230,656,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11619/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=2,230,848,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11620/500000] + optim/total_grad_norm=0.5838 + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,231,040,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11621/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=2,231,232,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11622/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=2,231,424,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11623/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=2,231,616,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11624/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,231,808,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11625/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=2,232,000,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11626/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=2,232,192,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11627/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,232,384,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11628/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=2,232,576,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11629/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=2,232,768,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11630/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,232,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11631/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,233,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11632/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=2,233,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11633/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,233,536,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11634/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=2,233,728,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11635/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=2,233,920,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11636/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=2,234,112,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11637/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=2,234,304,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11638/500000] + train/ActionNoiseL2Loss=0.0151 + throughput/total_tokens=2,234,496,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11639/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=2,234,688,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11640/500000] + optim/total_grad_norm=1.045 + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,234,880,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11641/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=2,235,072,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11642/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=2,235,264,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11643/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=2,235,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11644/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=2,235,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11645/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=2,235,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11646/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,236,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11647/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,236,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11648/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=2,236,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11649/500000] + train/ActionNoiseL2Loss=0.1428 + throughput/total_tokens=2,236,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11650/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=2,236,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11651/500000] + train/ActionNoiseL2Loss=0.0275 + throughput/total_tokens=2,236,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11652/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=2,237,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11653/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=2,237,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11654/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=2,237,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11655/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=2,237,760,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11656/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=2,237,952,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11657/500000] + train/ActionNoiseL2Loss=0.1200 + throughput/total_tokens=2,238,144,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11658/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=2,238,336,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11659/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,238,528,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11660/500000] + optim/total_grad_norm=1.356 + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=2,238,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11661/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=2,238,912,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11662/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=2,239,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11663/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=2,239,296,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11664/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,239,488,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11665/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,239,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11666/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=2,239,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11667/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=2,240,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11668/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=2,240,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11669/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=2,240,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11670/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=2,240,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11671/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=2,240,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11672/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,241,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11673/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=2,241,216,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11674/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=2,241,408,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11675/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=2,241,600,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11676/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=2,241,792,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11677/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=2,241,984,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11678/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=2,242,176,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11679/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=2,242,368,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11680/500000] + optim/total_grad_norm=1.012 + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,242,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11681/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=2,242,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11682/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=2,242,944,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11683/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=2,243,136,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11684/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=2,243,328,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11685/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=2,243,520,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11686/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=2,243,712,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11687/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=2,243,904,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11688/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=2,244,096,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11689/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=2,244,288,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11690/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=2,244,480,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11691/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=2,244,672,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11692/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,244,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11693/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,245,056,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11694/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=2,245,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11695/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=2,245,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11696/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=2,245,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11697/500000] + train/ActionNoiseL2Loss=0.0169 + throughput/total_tokens=2,245,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11698/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,246,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11699/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=2,246,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11700/500000] + optim/total_grad_norm=1.265 + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=2,246,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +wandb: WARNING A graphql request initiated by the public wandb API timed out (timeout=19 sec). Create a new API with an integer timeout larger than 19, e.g., `api = wandb.Api(timeout=29)` to increase the graphql timeout. +[step=11701/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=2,246,592,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11702/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=2,246,784,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11703/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=2,246,976,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11704/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,247,168,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11705/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=2,247,360,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11706/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=2,247,552,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11707/500000] + train/ActionNoiseL2Loss=0.0312 + throughput/total_tokens=2,247,744,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11708/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=2,247,936,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11709/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=2,248,128,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11710/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=2,248,320,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 + System/Peak GPU Memory (MB)=46,467 +[step=11711/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=2,248,512,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11712/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=2,248,704,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11713/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,248,896,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11714/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=2,249,088,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11715/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=2,249,280,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11716/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,249,472,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11717/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=2,249,664,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11718/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=2,249,856,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11719/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=2,250,048,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0459 +[step=11720/500000] + optim/total_grad_norm=1.031 + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=2,250,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11721/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,250,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11722/500000] + train/ActionNoiseL2Loss=0.0292 + throughput/total_tokens=2,250,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11723/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,250,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11724/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=2,251,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11725/500000] + train/ActionNoiseL2Loss=0.0149 + throughput/total_tokens=2,251,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11726/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=2,251,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11727/500000] + train/ActionNoiseL2Loss=0.0215 + throughput/total_tokens=2,251,584,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11728/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,251,776,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11729/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=2,251,968,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11730/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=2,252,160,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11731/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=2,252,352,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11732/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=2,252,544,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11733/500000] + train/ActionNoiseL2Loss=0.0133 + throughput/total_tokens=2,252,736,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11734/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=2,252,928,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11735/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=2,253,120,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11736/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=2,253,312,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11737/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=2,253,504,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11738/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=2,253,696,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11739/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=2,253,888,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11740/500000] + optim/total_grad_norm=1.503 + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,254,080,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11741/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=2,254,272,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11742/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=2,254,464,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11743/500000] + train/ActionNoiseL2Loss=0.0269 + throughput/total_tokens=2,254,656,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11744/500000] + train/ActionNoiseL2Loss=0.0230 + throughput/total_tokens=2,254,848,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11745/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=2,255,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11746/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=2,255,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11747/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=2,255,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11748/500000] + train/ActionNoiseL2Loss=0.0231 + throughput/total_tokens=2,255,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11749/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=2,255,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11750/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=2,256,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11751/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=2,256,192,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11752/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=2,256,384,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11753/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=2,256,576,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11754/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=2,256,768,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11755/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=2,256,960,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11756/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,257,152,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11757/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=2,257,344,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11758/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=2,257,536,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11759/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=2,257,728,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11760/500000] + optim/total_grad_norm=0.9564 + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=2,257,920,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11761/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=2,258,112,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11762/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=2,258,304,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11763/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=2,258,496,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11764/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=2,258,688,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11765/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=2,258,880,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11766/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=2,259,072,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11767/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=2,259,264,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11768/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=2,259,456,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11769/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=2,259,648,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11770/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=2,259,840,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11771/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=2,260,032,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11772/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=2,260,224,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11773/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,260,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11774/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=2,260,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11775/500000] + train/ActionNoiseL2Loss=0.0152 + throughput/total_tokens=2,260,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11776/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=2,260,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11777/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=2,261,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11778/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=2,261,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11779/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=2,261,568,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11780/500000] + optim/total_grad_norm=1.046 + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,261,760,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11781/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=2,261,952,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11782/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=2,262,144,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11783/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=2,262,336,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11784/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=2,262,528,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11785/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=2,262,720,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11786/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,262,912,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11787/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=2,263,104,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11788/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=2,263,296,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11789/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=2,263,488,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11790/500000] + train/ActionNoiseL2Loss=0.1451 + throughput/total_tokens=2,263,680,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11791/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=2,263,872,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11792/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=2,264,064,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11793/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=2,264,256,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11794/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=2,264,448,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11795/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=2,264,640,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11796/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,264,832,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11797/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=2,265,024,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11798/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=2,265,216,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11799/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,265,408,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=11800/500000] + optim/total_grad_norm=1.134 + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=2,265,600,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11801/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=2,265,792,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11802/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=2,265,984,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11803/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=2,266,176,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11804/500000] + train/ActionNoiseL2Loss=0.0303 + throughput/total_tokens=2,266,368,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11805/500000] + train/ActionNoiseL2Loss=0.0183 + throughput/total_tokens=2,266,560,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11806/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=2,266,752,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11807/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,266,944,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11808/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,267,136,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11809/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=2,267,328,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11810/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=2,267,520,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11811/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=2,267,712,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11812/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=2,267,904,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11813/500000] + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=2,268,096,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11814/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,268,288,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11815/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,268,480,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11816/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,268,672,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11817/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=2,268,864,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11818/500000] + train/ActionNoiseL2Loss=0.0199 + throughput/total_tokens=2,269,056,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11819/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=2,269,248,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11820/500000] + optim/total_grad_norm=0.8740 + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=2,269,440,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11821/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=2,269,632,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11822/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=2,269,824,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11823/500000] + train/ActionNoiseL2Loss=0.0258 + throughput/total_tokens=2,270,016,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11824/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=2,270,208,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11825/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=2,270,400,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11826/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=2,270,592,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11827/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=2,270,784,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11828/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=2,270,976,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11829/500000] + train/ActionNoiseL2Loss=0.0255 + throughput/total_tokens=2,271,168,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11830/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,271,360,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11831/500000] + train/ActionNoiseL2Loss=0.0243 + throughput/total_tokens=2,271,552,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11832/500000] + train/ActionNoiseL2Loss=0.1037 + throughput/total_tokens=2,271,744,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11833/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=2,271,936,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11834/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=2,272,128,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11835/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=2,272,320,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11836/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,272,512,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11837/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=2,272,704,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11838/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,272,896,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11839/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=2,273,088,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11840/500000] + optim/total_grad_norm=1.699 + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=2,273,280,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11841/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=2,273,472,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11842/500000] + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=2,273,664,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11843/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,273,856,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11844/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,274,048,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11845/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,274,240,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=11846/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=2,274,432,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11847/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,274,624,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11848/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=2,274,816,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11849/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=2,275,008,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=11850/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=2,275,200,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=11851/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=2,275,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11852/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=2,275,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11853/500000] + train/ActionNoiseL2Loss=0.0303 + throughput/total_tokens=2,275,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11854/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=2,275,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11855/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=2,276,160,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11856/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=2,276,352,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11857/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=2,276,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11858/500000] + train/ActionNoiseL2Loss=0.0291 + throughput/total_tokens=2,276,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11859/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=2,276,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11860/500000] + optim/total_grad_norm=0.9031 + train/ActionNoiseL2Loss=0.0271 + throughput/total_tokens=2,277,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11861/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=2,277,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11862/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=2,277,504,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11863/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=2,277,696,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11864/500000] + train/ActionNoiseL2Loss=0.1411 + throughput/total_tokens=2,277,888,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11865/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=2,278,080,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11866/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,278,272,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11867/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=2,278,464,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11868/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,278,656,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11869/500000] + train/ActionNoiseL2Loss=0.0223 + throughput/total_tokens=2,278,848,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11870/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=2,279,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11871/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,279,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11872/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=2,279,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11873/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=2,279,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11874/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=2,279,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11875/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=2,280,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11876/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=2,280,192,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11877/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=2,280,384,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11878/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=2,280,576,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11879/500000] + train/ActionNoiseL2Loss=0.0236 + throughput/total_tokens=2,280,768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11880/500000] + optim/total_grad_norm=1.009 + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,280,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11881/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=2,281,152,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11882/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=2,281,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11883/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,281,536,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11884/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=2,281,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11885/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=2,281,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11886/500000] + train/ActionNoiseL2Loss=0.0917 + throughput/total_tokens=2,282,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11887/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=2,282,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11888/500000] + train/ActionNoiseL2Loss=0.0233 + throughput/total_tokens=2,282,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11889/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=2,282,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11890/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=2,282,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11891/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=2,283,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11892/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,283,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11893/500000] + train/ActionNoiseL2Loss=0.1316 + throughput/total_tokens=2,283,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11894/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,283,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11895/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=2,283,840,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11896/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=2,284,032,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11897/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=2,284,224,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11898/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=2,284,416,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11899/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=2,284,608,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11900/500000] + optim/total_grad_norm=0.9097 + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=2,284,800,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11901/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,284,992,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11902/500000] + train/ActionNoiseL2Loss=0.0277 + throughput/total_tokens=2,285,184,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11903/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=2,285,376,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11904/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=2,285,568,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11905/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=2,285,760,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11906/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=2,285,952,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11907/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,286,144,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11908/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,286,336,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11909/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=2,286,528,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11910/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=2,286,720,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11911/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=2,286,912,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=11912/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=2,287,104,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11913/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=2,287,296,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11914/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=2,287,488,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11915/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=2,287,680,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11916/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=2,287,872,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11917/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=2,288,064,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=11918/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=2,288,256,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11919/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=2,288,448,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=11920/500000] + optim/total_grad_norm=0.9310 + train/ActionNoiseL2Loss=0.0293 + throughput/total_tokens=2,288,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11921/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=2,288,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11922/500000] + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=2,289,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11923/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=2,289,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11924/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=2,289,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11925/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=2,289,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11926/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=2,289,792,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11927/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,289,984,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11928/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,290,176,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11929/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=2,290,368,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11930/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=2,290,560,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11931/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=2,290,752,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11932/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=2,290,944,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11933/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,291,136,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11934/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=2,291,328,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11935/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=2,291,520,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11936/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=2,291,712,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11937/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=2,291,904,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11938/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=2,292,096,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11939/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=2,292,288,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11940/500000] + optim/total_grad_norm=0.8368 + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=2,292,480,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11941/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=2,292,672,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11942/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=2,292,864,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11943/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=2,293,056,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11944/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=2,293,248,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11945/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=2,293,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11946/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=2,293,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11947/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=2,293,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11948/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=2,294,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11949/500000] + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=2,294,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=11950/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=2,294,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=11951/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,294,592,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11952/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=2,294,784,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11953/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=2,294,976,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11954/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,295,168,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11955/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=2,295,360,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11956/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,295,552,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11957/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,295,744,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11958/500000] + train/ActionNoiseL2Loss=0.0231 + throughput/total_tokens=2,295,936,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11959/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=2,296,128,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11960/500000] + optim/total_grad_norm=0.8263 + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=2,296,320,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 + System/Peak GPU Memory (MB)=46,467 +[step=11961/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,296,512,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=11962/500000] + train/ActionNoiseL2Loss=0.0135 + throughput/total_tokens=2,296,704,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=11963/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=2,296,896,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=11964/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=2,297,088,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=11965/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=2,297,280,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=11966/500000] + train/ActionNoiseL2Loss=0.0138 + throughput/total_tokens=2,297,472,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=11967/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=2,297,664,000 + throughput/device/tokens_per_second=1,132 + throughput/device/batches_per_second=0.0472 +[step=11968/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,297,856,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=11969/500000] + train/ActionNoiseL2Loss=0.0278 + throughput/total_tokens=2,298,048,000 + throughput/device/tokens_per_second=1,132 + throughput/device/batches_per_second=0.0472 +[step=11970/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=2,298,240,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11971/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=2,298,432,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11972/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=2,298,624,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11973/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,298,816,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11974/500000] + train/ActionNoiseL2Loss=0.0184 + throughput/total_tokens=2,299,008,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11975/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=2,299,200,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11976/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=2,299,392,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11977/500000] + train/ActionNoiseL2Loss=0.0206 + throughput/total_tokens=2,299,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11978/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=2,299,776,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11979/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=2,299,968,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11980/500000] + optim/total_grad_norm=1.299 + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=2,300,160,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11981/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,300,352,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11982/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=2,300,544,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11983/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,300,736,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11984/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=2,300,928,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11985/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=2,301,120,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11986/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=2,301,312,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11987/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=2,301,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11988/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=2,301,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11989/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=2,301,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=11990/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=2,302,080,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=11991/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=2,302,272,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11992/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=2,302,464,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11993/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=2,302,656,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11994/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=2,302,848,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11995/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,303,040,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11996/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=2,303,232,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11997/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,303,424,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11998/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=2,303,616,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=11999/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=2,303,808,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12000/500000] + optim/total_grad_norm=1.532 + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,304,000,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +10/08 [15:49:32] INFO | >> Saving config... checkpoint.py:608 +10/08 [15:50:07] INFO | >> Saving model state... checkpoint.py:796 +10/08 [15:51:25] INFO | >> Saving optim state... checkpoint.py:811 +10/08 [15:52:59] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=12001/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=2,304,192,000 + throughput/device/tokens_per_second=1,191 + throughput/device/batches_per_second=0.0497 +[step=12002/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,304,384,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=12003/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,304,576,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0485 +[step=12004/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=2,304,768,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12005/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,304,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12006/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=2,305,152,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12007/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=2,305,344,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12008/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,305,536,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12009/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=2,305,728,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12010/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=2,305,920,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=12011/500000] + train/ActionNoiseL2Loss=0.0228 + throughput/total_tokens=2,306,112,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12012/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=2,306,304,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12013/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=2,306,496,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12014/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=2,306,688,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12015/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=2,306,880,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12016/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=2,307,072,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12017/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=2,307,264,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12018/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=2,307,456,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12019/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=2,307,648,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12020/500000] + optim/total_grad_norm=1.288 + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=2,307,840,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=12021/500000] + train/ActionNoiseL2Loss=0.0197 + throughput/total_tokens=2,308,032,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12022/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=2,308,224,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12023/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=2,308,416,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12024/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=2,308,608,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12025/500000] + train/ActionNoiseL2Loss=0.0217 + throughput/total_tokens=2,308,800,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12026/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=2,308,992,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12027/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=2,309,184,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12028/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,309,376,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12029/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=2,309,568,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12030/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=2,309,760,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=12031/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=2,309,952,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12032/500000] + train/ActionNoiseL2Loss=0.0229 + throughput/total_tokens=2,310,144,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12033/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=2,310,336,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12034/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=2,310,528,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12035/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=2,310,720,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12036/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=2,310,912,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12037/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,311,104,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12038/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=2,311,296,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12039/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,311,488,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12040/500000] + optim/total_grad_norm=1.107 + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=2,311,680,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=12041/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,311,872,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12042/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=2,312,064,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12043/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,312,256,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12044/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=2,312,448,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12045/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=2,312,640,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12046/500000] + train/ActionNoiseL2Loss=0.0246 + throughput/total_tokens=2,312,832,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12047/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=2,313,024,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12048/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,313,216,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12049/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=2,313,408,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=12050/500000] + train/ActionNoiseL2Loss=0.0226 + throughput/total_tokens=2,313,600,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=12051/500000] + train/ActionNoiseL2Loss=0.0148 + throughput/total_tokens=2,313,792,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=12052/500000] + train/ActionNoiseL2Loss=0.0122 + throughput/total_tokens=2,313,984,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=12053/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,314,176,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=12054/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=2,314,368,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=12055/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=2,314,560,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=12056/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=2,314,752,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=12057/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=2,314,944,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=12058/500000] + train/ActionNoiseL2Loss=0.0258 + throughput/total_tokens=2,315,136,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=12059/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=2,315,328,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=12060/500000] + optim/total_grad_norm=1.295 + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=2,315,520,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=12061/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=2,315,712,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0482 +[step=12062/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,315,904,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12063/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=2,316,096,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12064/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,316,288,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12065/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=2,316,480,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12066/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=2,316,672,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12067/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=2,316,864,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12068/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=2,317,056,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12069/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=2,317,248,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12070/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=2,317,440,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=12071/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=2,317,632,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12072/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=2,317,824,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12073/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=2,318,016,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12074/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=2,318,208,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12075/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=2,318,400,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12076/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=2,318,592,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12077/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=2,318,784,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12078/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=2,318,976,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12079/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,319,168,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12080/500000] + optim/total_grad_norm=1.375 + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,319,360,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=12081/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,319,552,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12082/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=2,319,744,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12083/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=2,319,936,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12084/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,320,128,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12085/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=2,320,320,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12086/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=2,320,512,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12087/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=2,320,704,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12088/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=2,320,896,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12089/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=2,321,088,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12090/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=2,321,280,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=12091/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=2,321,472,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12092/500000] + train/ActionNoiseL2Loss=0.0245 + throughput/total_tokens=2,321,664,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12093/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=2,321,856,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12094/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=2,322,048,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12095/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=2,322,240,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12096/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,322,432,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12097/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=2,322,624,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12098/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=2,322,816,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12099/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,323,008,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=12100/500000] + optim/total_grad_norm=0.9245 + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=2,323,200,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 + System/Peak GPU Memory (MB)=46,467 +[step=12101/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,323,392,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12102/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,323,584,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12103/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=2,323,776,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12104/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,323,968,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12105/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=2,324,160,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12106/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,324,352,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12107/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=2,324,544,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12108/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,324,736,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12109/500000] + train/ActionNoiseL2Loss=0.0265 + throughput/total_tokens=2,324,928,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12110/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=2,325,120,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 + System/Peak GPU Memory (MB)=46,467 +[step=12111/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,325,312,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=12112/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,325,504,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12113/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=2,325,696,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12114/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=2,325,888,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12115/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=2,326,080,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12116/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=2,326,272,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12117/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=2,326,464,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12118/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=2,326,656,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12119/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=2,326,848,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=12120/500000] + optim/total_grad_norm=1.290 + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=2,327,040,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 + System/Peak GPU Memory (MB)=46,467 +[step=12121/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=2,327,232,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=12122/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=2,327,424,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=12123/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=2,327,616,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=12124/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=2,327,808,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=12125/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,328,000,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 diff --git a/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/files/requirements.txt b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/files/requirements.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8 --- /dev/null +++ b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/files/requirements.txt @@ -0,0 +1,286 @@ +ai2-molmo==0.0.0 +astunparse==1.6.3 +flatbuffers==25.2.10 +gast==0.6.0 +google-pasta==0.2.0 +h5py==3.14.0 +libclang==18.1.1 +Markdown==3.9 +namex==0.1.0 +opt_einsum==3.4.0 +optree==0.17.0 +tensorboard-data-server==0.7.2 +tensorflow-io-gcs-filesystem==0.37.1 +termcolor==3.1.0 +Werkzeug==3.1.3 +Brotli==1.1.0 +Farama-Notifications==0.0.4 +MarkupSafe==2.1.5 +PyYAML==6.0.2 +absl-py==2.3.1 +accelerate==1.10.1 +ai2-molmo==0.0.0 +aiofiles==24.1.0 +aiohappyeyeballs==2.6.1 +aiohttp==3.12.15 +aiosignal==1.4.0 +annotated-types==0.7.0 +antlr4-python3-runtime==4.9.3 +anyio==4.10.0 +array_record==0.8.1 +async-timeout==5.0.1 +attrs==25.3.0 +av==15.1.0 +backports.tarfile==1.2.0 +beaker-gantry==3.2.0 +beaker-py==2.5.0 +black==23.12.1 +blinker==1.9.0 +boltons==25.0.0 +boto3==1.40.33 +botocore==1.40.33 +build==1.3.0 +cached_path==1.7.3 +cached-property==2.0.1 +cachetools==5.5.2 +certifi==2025.8.3 +cffi==2.0.0 +charset-normalizer==3.4.3 +click==8.2.1 +click-help-colors==0.9.4 +click-option-group==0.5.7 +cloudpickle==3.1.1 +cmake==4.1.0 +contourpy==1.3.2 +cryptography==46.0.1 +cycler==0.12.1 +dataclass-extensions==0.2.3 +datasets==3.6.0 +decorator==5.2.1 +deepdiff==8.6.1 +diffusers==0.35.1 +dill==0.3.8 +distro==1.9.0 +dlimp==0.0.1 +dm-tree==0.1.9 +docutils==0.22.1 +draccus==0.10.0 +editdistance==0.8.1 +einops==0.8.1 +einops-exts==0.0.4 +et_xmlfile==2.0.0 +etils==1.13.0 +evdev==1.9.2 +exceptiongroup==1.3.0 +face==24.0.0 +fastapi==0.116.2 +ffmpy==0.6.1 +fiddle==0.3.0 +filelock==3.13.1 +Flask==3.1.2 +fonttools==4.60.0 +frozenlist==1.7.0 +fsspec==2023.9.2 +ftfy==6.3.1 +gcsfs==2023.9.2 +gitdb==4.0.12 +GitPython==3.1.45 +glom==24.11.0 +google-api-core==2.25.1 +google-auth==2.40.3 +google-auth-oauthlib==1.2.2 +google-cloud-core==2.4.3 +google-cloud-storage==2.19.0 +google-crc32c==1.7.1 +google-resumable-media==2.7.2 +googleapis-common-protos==1.70.0 +gradio==5.46.0 +gradio_client==1.13.0 +graphviz==0.21 +groovy==0.1.2 +grpcio==1.75.0 +gymnasium==0.29.1 +h11==0.16.0 +hf_transfer==0.1.9 +hf-xet==1.1.10 +httpcore==1.0.9 +httpx==0.28.1 +huggingface-hub==0.35.0 +id==1.5.0 +idna==3.10 +imageio==2.37.0 +imageio-ffmpeg==0.6.0 +importlib_metadata==8.7.0 +importlib_resources==6.5.2 +iniconfig==2.1.0 +inquirerpy==0.3.4 +isort==5.12.0 +itsdangerous==2.2.0 +jaraco.classes==3.4.0 +jaraco.context==6.0.1 +jaraco.functools==4.3.0 +jeepney==0.9.0 +Jinja2==3.1.4 +jiter==0.11.0 +jmespath==1.0.1 +joblib==1.5.2 +jsonlines==4.0.0 +keras==2.15.0 +keyring==25.6.0 +kiwisolver==1.4.9 +latex2sympy2_extended==1.10.2 +lerobot==0.3.4 +Levenshtein==0.27.1 +libcst==1.8.4 +lightning-utilities==0.15.2 +markdown-it-py==4.0.0 +math-verify==0.8.0 +matplotlib==3.10.6 +mdurl==0.1.2 +mergedeep==1.3.4 +ml-dtypes==0.2.0 +ml_dtypes==0.5.3 +more-itertools==10.8.0 +mpmath==1.3.0 +msgspec==0.19.0 +multidict==6.6.4 +multiprocess==0.70.16 +mypy==1.3.0 +mypy_extensions==1.1.0 +necessary==0.4.3 +networkx==3.3 +nh3==0.3.0 +nltk==3.9.1 +numpy==1.26.4 +oauthlib==3.3.1 +omegaconf==2.3.0 +openai==1.108.0 +opencv-python-headless==4.12.0.88 +OpenEXR==3.4.0 +openpyxl==3.1.5 +orderly-set==5.5.0 +orjson==3.11.3 +packaging==25.0 +pandas==2.3.2 +pathspec==0.12.1 +petname==2.6 +pfzy==0.3.4 +pillow==11.0.0 +pip==25.2 +platformdirs==4.4.0 +pluggy==1.6.0 +promise==2.3 +prompt_toolkit==3.0.52 +propcache==0.3.2 +proto-plus==1.26.1 +protobuf==4.21.12 +protobuf==6.32.1 +psutil==7.1.0 +pyarrow==21.0.0 +pyasn1==0.6.1 +pyasn1_modules==0.4.2 +pycparser==2.23 +pydantic==2.11.9 +pydantic_core==2.33.2 +pydub==0.25.1 +Pygments==2.19.2 +pynput==1.8.1 +pyparsing==3.2.4 +pyproject_hooks==1.2.0 +pyserial==3.5 +pytest==8.4.2 +pytest-sphinx==0.6.3 +python-dateutil==2.9.0.post0 +python-Levenshtein==0.27.1 +python-multipart==0.0.20 +python-xlib==0.33 +pytorch-triton-rocm==3.4.0 +pytz==2025.2 +pyyaml-include==1.4.1 +RapidFuzz==3.14.1 +readme_renderer==44.0 +regex==2025.9.1 +requests==2.32.5 +requests-oauthlib==2.0.0 +requests-toolbelt==1.0.0 +requirements-parser==0.13.0 +rerun-sdk==0.22.1 +rfc3986==2.0.0 +rich==13.9.4 +rsa==4.9.1 +ruff==0.13.0 +s3transfer==0.14.0 +safehttpx==0.1.6 +safetensors==0.6.2 +scikit-learn==1.7.2 +scipy==1.15.3 +SecretStorage==3.4.0 +semantic-version==2.10.0 +sentencepiece==0.2.1 +sentry-sdk==2.38.0 +setuptools==78.1.1 +shellingham==1.5.4 +six==1.17.0 +smart_open==7.3.1 +smashed==0.21.5 +smmap==5.0.2 +sniffio==1.3.1 +starlette==0.48.0 +sympy==1.13.3 +tensorboard==2.15.2 +tensorboard==2.19.0 +tensorflow==2.15.0 +tensorflow-addons==0.23.0 +tensorflow-datasets==4.9.3 +tensorflow-estimator==2.15.0 +tensorflow-graphics==2021.12.3 +tensorflow-metadata==1.17.2 +threadpoolctl==3.6.0 +timm==1.0.19 +tokenizers==0.22.0 +toml==0.10.2 +tomli==2.2.1 +tomlkit==0.13.3 +torch==2.8.0+rocm6.4 +torchcodec==0.5 +torchmetrics==1.8.2 +torchvision==0.23.0+rocm6.4 +tqdm==4.67.1 +transformers==4.56.1 +trimesh==4.8.2 +trouting==0.3.3 +twine==6.2.0 +typeguard==2.13.3 +typer==0.17.4 +typing_extensions==4.15.0 +typing-inspect==0.9.0 +typing-inspection==0.4.1 +tzdata==2025.2 +urllib3==2.5.0 +uvicorn==0.35.0 +wandb==0.21.4 +wcwidth==0.2.13 +websockets==15.0.1 +wheel==0.45.1 +wrapt==1.14.2 +xxhash==3.5.0 +yarl==1.20.1 +zipp==3.23.0 +lerobot==0.3.4 +minLoRA==0.1.0 +autocommand==2.2.2 +backports.tarfile==1.2.0 +importlib_metadata==8.0.0 +inflect==7.3.1 +jaraco.collections==5.1.0 +jaraco.context==5.3.0 +jaraco.functools==4.0.1 +jaraco.text==3.12.1 +more-itertools==10.3.0 +packaging==24.2 +platformdirs==4.2.2 +tomli==2.0.1 +typeguard==4.3.0 +typing_extensions==4.12.2 +wheel==0.45.1 +zipp==3.19.2 diff --git a/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/files/wandb-metadata.json b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/files/wandb-metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..92dfc7fb52bfbb03f1dda473fb4c9947e547b832 --- /dev/null +++ b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/files/wandb-metadata.json @@ -0,0 +1,204 @@ +{ + "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35", + "python": "CPython 3.10.18", + "startedAt": "2025-10-05T16:38:02.136539Z", + "args": [ + "qwen2_7b", + "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk_flow_matching", + "--vision_backbone", + "openai", + "--action_head", + "flow_matching", + "--seq_len", + "1600", + "--ft_llm", + "--checkpoint", + "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924", + "--device_train_microbatch_size", + "16", + "--global_batch_size", + "126", + "--dataset", + "vla_dataset_realworld", + "--llm_learning_rate", + "5e-5", + "--wandb_entity", + "henryeap", + "--wandb_project", + "a1-realworld", + "--wandb_run_name", + "cleandesk", + "--real_world_vla_config_path", + "vla_config_realworld/vla_config_cleandesk.yaml", + "--save_overwrite" + ], + "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py", + "codePath": "launch_scripts/train_vla.py", + "codePathLocal": "launch_scripts/train_vla.py", + "git": { + "remote": "https://github.com/Spatialtemporal-AI/A1.git", + "commit": "5071f59d87c6a976691323cbac66d7a988b0b4e7" + }, + "email": "ihenrykwok@outlook.com", + "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk_flow_matching/wandb", + "host": "auh7-1b-gpu-320", + "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10", + "cpu_count": 64, + "cpu_count_logical": 128, + "gpu": "Instinct MI210", + "gpu_count": 8, + "disk": { + "/": { + "total": "3778763694080", + "used": "55512412160" + } + }, + "memory": { + "total": "2434606968832" + }, + "gpu_amd": [ + { + "id": "0", + "uniqueId": "0xdc567fc68d1a0c91", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "1", + "uniqueId": "0xc976bbc2ad247ea6", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "5", + "uniqueId": "0xc7fbd07780c2f202", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "7", + "uniqueId": "0xe56b0d719426d5a8", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "3", + "uniqueId": "0xa7a04689129eefa4", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "4", + "uniqueId": "0xec560c9e435b50ba", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "2", + "uniqueId": "0xcbcb7103099a436c", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "6", + "uniqueId": "0x5bb2d7fad259574f", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + } + ], + "slurm": { + "cluster_name": "ai-04r", + "conf": "/etc/slurm/slurm.conf", + "cpus_on_node": "128", + "gpus_on_node": "8", + "gtids": "0", + "job_account": "faculty-acc", + "job_cpus_per_node": "128", + "job_end_time": "1759941420", + "job_gid": "2000", + "job_gpus": "0,1,2,3,4,5,6,7", + "job_id": "2281", + "job_name": "mh_cleandesk_flow_matching", + "job_nodelist": "auh7-1b-gpu-320", + "job_num_nodes": "1", + "job_partition": "faculty", + "job_qos": "xdqos", + "job_start_time": "1759682220", + "job_uid": "2013", + "job_user": "xiaodan", + "jobid": "2281", + "localid": "0", + "nnodes": "1", + "nodeid": "0", + "nodelist": "auh7-1b-gpu-320", + "nprocs": "1", + "ntasks": "1", + "ntasks_per_node": "1", + "oom_kill_step": "0", + "prio_process": "0", + "procid": "0", + "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts", + "submit_host": "auh-1b-cpu-login-001", + "task_pid": "561699", + "tasks_per_node": "1", + "topology_addr": "auh7-1b-gpu-320", + "topology_addr_pattern": "node" + }, + "writerId": "cg68x37yky6rbl9tr7pshd5fx8s61qiy" +} \ No newline at end of file diff --git a/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/logs/debug-core.log b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/logs/debug-core.log new file mode 100644 index 0000000000000000000000000000000000000000..ed38932a1c18d277f4473feef372badcf8df0da9 --- /dev/null +++ b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/logs/debug-core.log @@ -0,0 +1,6 @@ +{"time":"2025-10-05T16:38:02.386747526Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpn27ektbq/port-561890.txt","pid":561890,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false} +{"time":"2025-10-05T16:38:02.388360677Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":561890} +{"time":"2025-10-05T16:38:02.389267188Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-561890-562080-1724540830/socket","Net":"unix"}} +{"time":"2025-10-05T16:38:02.586570534Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"} +{"time":"2025-10-05T16:38:02.600696794Z","level":"INFO","msg":"handleInformInit: received","streamId":"gqyapbwp","id":"1(@)"} +{"time":"2025-10-05T16:38:03.762891268Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"gqyapbwp","id":"1(@)"} diff --git a/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/logs/debug-internal.log b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/logs/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..1ba7edbb8635596525174158f909fd1d567e371b --- /dev/null +++ b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/logs/debug-internal.log @@ -0,0 +1,12 @@ +{"time":"2025-10-05T16:38:02.602917026Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-05T16:38:03.762826737Z","level":"INFO","msg":"stream: created new stream","id":"gqyapbwp"} +{"time":"2025-10-05T16:38:03.762885338Z","level":"INFO","msg":"stream: started","id":"gqyapbwp"} +{"time":"2025-10-05T16:38:03.762906828Z","level":"INFO","msg":"writer: started","stream_id":"gqyapbwp"} +{"time":"2025-10-05T16:38:03.762906838Z","level":"INFO","msg":"sender: started","stream_id":"gqyapbwp"} +{"time":"2025-10-05T16:38:03.762920708Z","level":"INFO","msg":"handler: started","stream_id":"gqyapbwp"} +{"time":"2025-10-06T19:04:19.555419176Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"} +{"time":"2025-10-06T20:03:34.950654374Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"} +{"time":"2025-10-07T15:02:38.499153299Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"} +{"time":"2025-10-07T21:28:37.643147942Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-07T22:22:44.986859439Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-07T23:26:33.122893273Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/gqyapbwp/file_stream","body":"\n\n\n502 Server Error\n\n\n

Error: Server Error

\n

The server encountered a temporary error and could not complete your request.

Please try again in 30 seconds.

\n

\n\n"} diff --git a/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/logs/debug.log b/cleandesk_flow_matching/wandb/wandb/run-20251005_163802-gqyapbwp/logs/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/cleandesk_l1_regression/wandb/wandb/debug-internal.log b/cleandesk_l1_regression/wandb/wandb/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..46affc2ba51fb5f59733037d81f939926d62e073 --- /dev/null +++ b/cleandesk_l1_regression/wandb/wandb/debug-internal.log @@ -0,0 +1,12 @@ +{"time":"2025-10-08T16:38:32.19998745Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-08T16:38:33.339827981Z","level":"INFO","msg":"stream: created new stream","id":"76mxu43t"} +{"time":"2025-10-08T16:38:33.339874102Z","level":"INFO","msg":"stream: started","id":"76mxu43t"} +{"time":"2025-10-08T16:38:33.339905492Z","level":"INFO","msg":"handler: started","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:38:33.339893552Z","level":"INFO","msg":"writer: started","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:38:33.339947873Z","level":"INFO","msg":"sender: started","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:43:58.756754711Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"updating run metadata","runtime_seconds":0.006574606}],"total_operations":1}} +{"time":"2025-10-08T16:43:59.766243448Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"} +{"time":"2025-10-08T16:44:00.127335826Z","level":"INFO","msg":"stream: closing","id":"76mxu43t"} +{"time":"2025-10-08T16:44:00.127349836Z","level":"INFO","msg":"handler: closed","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:44:00.128408003Z","level":"INFO","msg":"sender: closed","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:44:00.128424754Z","level":"INFO","msg":"stream: closed","id":"76mxu43t"} diff --git a/cleandesk_l1_regression/wandb/wandb/debug.log b/cleandesk_l1_regression/wandb/wandb/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/config.yaml b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..299386348a4b4bbe7bff50dd2fb8e617ee04d39c --- /dev/null +++ b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/config.yaml @@ -0,0 +1,623 @@ +_wandb: + value: + cli_version: 0.21.4 + e: + 9zghejqbkg668a368vduhoyzhbv4wgq6: + args: + - qwen2_7b + - save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk_l1_regression + - --vision_backbone + - openai + - --action_head + - l1_regression + - --seq_len + - "1600" + - --ft_llm + - --checkpoint + - /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 + - --device_train_microbatch_size + - "16" + - --global_batch_size + - "126" + - --dataset + - vla_dataset_realworld + - --llm_learning_rate + - "5e-5" + - --wandb_entity + - henryeap + - --wandb_project + - a1-realworld + - --wandb_run_name + - cleandesk + - --real_world_vla_config_path + - vla_config_realworld/vla_config_cleandesk.yaml + - --save_overwrite + codePath: launch_scripts/train_vla.py + codePathLocal: launch_scripts/train_vla.py + cpu_count: 64 + cpu_count_logical: 128 + disk: + /: + total: "470343073792" + used: "50668195840" + email: ihenrykwok@outlook.com + executable: /vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10 + git: + commit: 49712a42d21a8c739a16ba5eeaec4a0d7b29ab80 + remote: https://github.com/Spatialtemporal-AI/A1.git + gpu: Instinct MI210 + gpu_amd: + - id: "3" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x62b25d667064a7ff" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "6" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0xbdb93fac1aa97618" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "7" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x850c5a1ff5d005be" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "2" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x7a3e2781f4182456" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "4" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x4c21a2ad76408df6" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "0" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0xa8d2c33980704bf2" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "1" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0xd13265721a117b54" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + - id: "5" + maxPower: "300.0" + mclkRange: 400Mhz - 1600Mhz + model: "0x740f" + performanceLevel: auto + sclkRange: 500Mhz - 1700Mhz + series: Instinct MI210 + sku: D67301V + uniqueId: "0x19ee82506963794b" + vbiosVersion: 113-D67301V-073 + vendor: Advanced Micro Devices, Inc. [AMD/ATI] + gpu_count: 8 + host: auh7-1b-gpu-316 + memory: + total: "2434606952448" + os: Linux-5.15.0-140-generic-x86_64-with-glibc2.35 + program: /vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py + python: CPython 3.10.18 + root: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk_l1_regression/wandb + slurm: + cluster_name: ai-04r + conf: /etc/slurm/slurm.conf + cpus_on_node: "128" + gpus_on_node: "8" + gtids: "0" + job_account: faculty-acc + job_cpus_per_node: "128" + job_end_time: "1760200645" + job_gid: "2000" + job_gpus: 0,1,2,3,4,5,6,7 + job_id: "2282" + job_name: mh_cleandesk_l1_regression + job_nodelist: auh7-1b-gpu-316 + job_num_nodes: "1" + job_partition: faculty + job_qos: xdqos + job_start_time: "1759941445" + job_uid: "2013" + job_user: xiaodan + jobid: "2282" + localid: "0" + nnodes: "1" + nodeid: "0" + nodelist: auh7-1b-gpu-316 + nprocs: "1" + ntasks: "1" + ntasks_per_node: "1" + oom_kill_step: "0" + prio_process: "0" + procid: "0" + submit_dir: /vast/users/xiaodan/zhangjian/A1/launch_scripts + submit_host: auh-1b-cpu-login-001 + task_pid: "1925818" + tasks_per_node: "1" + topology_addr: auh7-1b-gpu-316 + topology_addr_pattern: node + startedAt: "2025-10-08T16:38:31.938958Z" + writerId: 9zghejqbkg668a368vduhoyzhbv4wgq6 + m: [] + python_version: 3.10.18 + t: + "1": + - 1 + - 2 + - 3 + - 5 + - 11 + - 41 + - 49 + - 51 + - 53 + - 63 + - 71 + - 83 + - 95 + - 105 + "2": + - 1 + - 2 + - 3 + - 5 + - 11 + - 41 + - 49 + - 51 + - 53 + - 63 + - 71 + - 83 + - 95 + - 105 + "3": + - 2 + - 13 + - 15 + - 16 + - 61 + "4": 3.10.18 + "5": 0.21.4 + "6": 4.56.1 + "10": + - 19 + "12": 0.21.4 + "13": linux-x86_64 +activation_checkpointing: + value: whole_layer +allow_resume: + value: false +batch_divisor: + value: global_batch +canceled_check_interval: + value: 50 +checkpoint_dir: + value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +compile: + value: null +console_log_interval: + value: 1 +data: + value: + dataset: vla_dataset_realworld + drop_last: true + for_inference: false + lerobot_episode_index_end: null + lerobot_episode_index_start: null + mixture: null + multi_modal: torch + num_workers: 0 + pad: to_max + persistent_workers: false + pin_memory: true + prefetch_factor: null + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_read_threads: 8 + rlds_shuffle_buffer_size: 100000 + rlds_traj_threads: 8 + root_size_mixture: null + seed: 95818 + sequence_length: 1600 + shuffle: true + shuffle_messages: false + split: train + timeout: 0 + use_proprio: true + use_wrist_image: true +device_eval_batch_size: + value: 4 +device_inf_eval_batch_size: + value: 16 +device_train_batch_size: + value: 15 +device_train_grad_accum: + value: 0 +device_train_microbatch_size: + value: 16 +dry_run: + value: false +early_exit: + value: false +epoch: + value: null +eval_interval: + value: 0 +eval_on_load: + value: false +eval_subset_num_batches: + value: -1 +evaluators: + value: + - data: + dataset: vla_dataset_realworld + drop_last: true + for_inference: false + lerobot_episode_index_end: 765 + lerobot_episode_index_start: 353 + mixture: null + multi_modal: torch + num_workers: 0 + pad: to_max + persistent_workers: true + pin_memory: true + prefetch_factor: null + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_read_threads: 8 + rlds_shuffle_buffer_size: 256000 + rlds_traj_threads: 8 + root_size_mixture: null + seed: null + sequence_length: 1600 + shuffle: false + shuffle_messages: false + split: validation + timeout: 0 + use_proprio: true + use_wrist_image: true + device_eval_batch_size: null + eval_name: null + label: val + max_examples: null + max_new_tokens: 448 + mm_evaluator: null + save_dir: null + save_to_checkpoint_dir: false + skip_if_metrics_cached: true + subset_num_batches: 64 +extra_steps_after_cancel: + value: 10 +fast_forward_batches: + value: null +force_save_unsharded: + value: false +fsdp: + value: + hybrid_sharding_num_model_replicas: null + precision: float + sharding_strategy: FULL_SHARD + use_orig_params: true + wrapping_strategy: by_block_and_size +ft_connector: + value: false +ft_embedding: + value: lm_head +ft_llm: + value: true +ft_vit: + value: false +fused_loss: + value: null +gen1_gc_interval: + value: 1 +global_train_batch_size: + value: 126 +inf_eval_interval: + value: -1 +inf_eval_subset_num_batches: + value: -1 +inf_evaluators: + value: [] +initial_model_checkpoint: + value: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +keep_lr_on_load: + value: true +load_model_config: + value: null +load_path: + value: null +load_path_sharded_checkpointer: + value: null +lora: + value: false +lora_connector: + value: false +lora_llm: + value: false +lora_rank: + value: 8 +lora_vit: + value: false +max_duration: + value: 500000 +max_grad_norm: + value: 1 +max_grad_norm_ratio: + value: null +model: + value: + action_dim: 7 + action_head: l1_regression + action_head_dit_depth: 28 + action_head_dit_hidden_size: 1152 + action_head_dit_num_heads: 16 + action_tokenizer: + identifier: physical-intelligence/fast + tokenizer_dir: null + action_use_left_eef: true + action_use_mobile_base: false + activation_type: swiglu + additional_vocab_size: 128 + always_start_with_space: true + attention_dropout: 0 + attention_layer_norm: false + attention_layer_norm_with_affine: true + attention_type: sdpa + bias_for_layer_norm: null + block_group_size: 1 + block_type: sequential + clip_qkv: null + crop_mode: overlap-and-resize-c2 + d_model: 3584 + default_inference_len: 65 + embedding_dropout: 0 + embedding_size: 152064 + ff_out_size: null + fix_image_padding: true + float32_attention: true + head_dim: null + horizon: 8 + image_feature_dropout: 0 + image_padding_embed: pad_and_partial_pad + image_pooling_2d: attention_meanq + image_pooling_h: 2 + image_pooling_w: 2 + image_projector: mlp + include_bias: false + init_cutoff_factor: null + init_device: null + init_fn: normal + init_std: 0.02 + initializer_range: 0.02 + layer_norm_eps: 1e-06 + layer_norm_type: rms + layer_norm_with_affine: true + llm_causal_attention: false + llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt + low_cpu_fsdp: true + max_crops: 12 + max_position_embeddings: null + max_sequence_length: 4096 + message_formatting: role + mlp_hidden_size: 37888 + mlp_ratio: 4 + moe_capacity_factor: 1.25 + moe_dropless: true + moe_interleave: false + moe_lbl_in_fp32: false + moe_log_expert_assignment: false + moe_loss_weight: 0.1 + moe_mlp_impl: sparse + moe_num_experts: 8 + moe_shared_expert: false + moe_top_k: 2 + moe_zloss_weight: null + multi_annotation_weighting: root_subsegments + n_heads: 28 + n_kv_heads: 4 + n_layers: 28 + new_embedding_init_range: 0.02 + norm_after: false + normalize_input_embeds: false + num_diffusion_inference_steps: 30 + num_diffusion_steps: 1000 + overlap_margins: + - 4 + - 4 + pad_tokenizer: true + pad_value: 0 + precision: amp_bf16 + prompt_type: uber_model + qkv_bias: true + residual_dropout: 0.1 + response_residual_dropout: 0 + rope: true + rope_full_precision: true + rope_theta: 1e+06 + scale_logits: false + system_prompt_kind: demo_or_style + tokenizer: + identifier: Qwen/Qwen2-7B + tokenizer_dir: null + use_col_tokens: true + use_position_ids: true + use_proprio: true + vision_backbone: + attention_dropout: 0 + fsdp_wrap: false + image_default_input_size: + - 336 + - 336 + image_dropout_rate: 0 + image_emb_dim: 1024 + image_head_dim: 64 + image_mlp_activations: quick_gelu + image_mlp_dim: 4096 + image_model_type: openai + image_norm_eps: 1e-05 + image_num_heads: 16 + image_num_key_value_heads: 16 + image_num_layers: 23 + image_num_pos: 577 + image_patch_size: 14 + image_pos_patch_size: 14 + initializer_range: 0.02 + residual_dropout: 0 + resize_mode: default + vit_layers: + - -2 + - -9 + vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt + vocab_size: 152064 + weight_tying: false +multi_component_grad_norm: + value: true +no_pre_train_checkpoint: + value: true +optimizer: + value: + betas: + - 0.9 + - 0.95 + connector_betas: + - 0.9 + - 0.95 + connector_eps: 1e-06 + connector_learning_rate: 0.0002 + connector_weight_decay: 0 + eps: 1e-05 + learning_rate: 0.0001 + llm_betas: + - 0.9 + - 0.95 + llm_eps: 1e-06 + llm_learning_rate: 5e-05 + llm_weight_decay: 0 + metrics_log_interval: 20 + name: adamw + vit_betas: + - 0.9 + - 0.95 + vit_eps: 1e-06 + vit_learning_rate: 6e-06 + vit_weight_decay: 0 + weight_decay: 0.01 +precision: + value: amp_bf16 +python_profiling: + value: false +remote_save_folder: + value: null +reset_dataloader_state: + value: false +reset_optimizer_state: + value: false +reset_trainer_state: + value: false +restore_dataloader: + value: true +run_name: + value: cleandesk_20251008_163754 +save_dataloader_state: + value: false +save_folder: + value: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk_l1_regression +save_interval: + value: 500 +save_interval_action_head: + value: 500 +save_interval_ephemeral: + value: null +save_interval_unsharded: + value: 500 +save_num_action_head_checkpoints_to_keep: + value: 2 +save_num_checkpoints_to_keep: + value: 1 +save_num_unsharded_checkpoints_to_keep: + value: 1 +save_overwrite: + value: true +scheduler: + value: + alpha_f: 0.1 + connector_t_warmup: 200 + grad_clip_warmup_factor: null + grad_clip_warmup_steps: null + llm_t_warmup: 2000 + name: multimodal + t_max: null + t_warmup: 100 + units: steps + vit_t_warmup: 2000 + warmup_min_lr: 0 +seed: + value: 6198 +sharded_checkpointer: + value: torch_legacy +softmax_auxiliary_loss: + value: true +softmax_auxiliary_loss_scale: + value: 0.0001 +speed_monitor: + value: + gpu_flops_available: null + window_size: 20 +stop_after: + value: null +stop_at: + value: 500000 +time_limit: + value: null +torch_profiling: + value: false +train_exit_random_layer: + value: false +use_lora: + value: false diff --git a/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/output.log b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/output.log new file mode 100644 index 0000000000000000000000000000000000000000..bfa8240834c38c3de2ef5f5c119487d3d81c9890 --- /dev/null +++ b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/output.log @@ -0,0 +1,183 @@ +wandb: Detected [openai] in use. +wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script. +wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/ +10/08 [16:38:34] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}} +****** Skip RLDS main; path not found: None +****** start build LeRobot main... +build_tokenizer, cache_dir None tokenizer_dir None +10/08 [16:38:35] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130 +10/08 [16:38:36] INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:436 +****** before LeRobot dataset... +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_CleanDesk +****** length of the dataset: 72641 +10/08 [16:38:42] INFO | >> build_rlds_train_dataset: Loading train dataset: vla_dataset_realworld/train __init__.py:519 +****** Import RLDSBatchTransform, RLDSDataset successfully. +****** before RLDS dataset... +****** data_config.rlds_dataset_name: a1_real_world +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE +214************** + INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 87212/87212 [00:43<00:00, 2004.76it/s] +214************** +10/08 [16:39:30] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/jaco_play/0.1.0/dataset_statistics_e081d4716a3da95df91c79d661ae59fa26a43da49db4bf8d716b622b56 + 3b0ea3.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_cable_routing/0.1.0/dataset_statistics_08cb4c5b7c5e6c035fc84ea85b2d54c0c46ad608a8763 + 4ebb18374088d23cd76.json. +214************** +10/08 [16:39:31] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/viola/0.1.0/dataset_statistics_2415d8f7de73c8761fedd7c2a9590667fb0d3fdd26664bf4c100222e5cdb89 + b9.json. +214************** + INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 1000/1000 [00:05<00:00, 184.79it/s] +214************** +10/08 [16:39:38] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_buds_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_ccecde24cc01793b221 + 4eb0c4c5d7cc0e3ccc623db99bd892b83552b20decfb7.json. +214************** +10/08 [16:39:39] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 456/456 [00:24<00:00, 18.55it/s] +214************** +10/08 [16:40:06] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 5100/5100 [00:57<00:00, 88.36it/s] +214************** +10/08 [16:41:08] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 240/240 [00:08<00:00, 29.80it/s] +214************** +10/08 [16:41:20] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_sirius_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_cb2e0273f80029a19 + dc3dbb3a3a4118a5598e7bff3ff0245891255825b04b42a.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/dlr_edan_shared_control_converted_externally_to_rlds/0.1.0/dataset_statistics_b8984563fc3e7ea + c0803c667ef58c9deaf2e747683568306ea1d83505d532a76.json. +214************** +10/08 [16:41:21] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 1500/1500 [00:02<00:00, 664.65it/s] +214************** +10/08 [16:41:24] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_fanuc_manipulation/0.1.0/dataset_statistics_a98d349d0364668095ea3ca38c6785e94f35e5e5 + 8e234c88fac83775a923b0d0.json. +214************** +10/08 [16:41:25] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 43264/43264 [00:32<00:00, 1321.74it/s] +214************** +10/08 [16:42:02] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/roboturk/0.1.0/dataset_statistics_3aa821e17a2937f941d4102cfadcb1154853cb45dcec07ccc66893b01f6 + f1b40.json. +214************** +10/08 [16:42:03] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 1003/1003 [00:00<00:00, 1714.08it/s] +214************** +10/08 [16:42:04] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/ucsd_kitchen_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_1f1a5f310a2d5a6edc + 0e217370e135c8c8598290f11f57025037adcb0d033926.json. +214************** +10/08 [16:42:05] INFO | >> [*] Computing dataset statistics. This may take a bit, but should only need to happen once. data_utils.py:227 +100%|██████████| 631/631 [00:00<00:00, 1276.86it/s] + +###################################################################################### +# Loading the following 18 datasets (incl. sampling weight): # +# fractal20220817_data: ====================================================0.529250 # +# jaco_play: ===============================================================0.010898 # +# berkeley_cable_routing: ==================================================0.005916 # +# viola: ===================================================================0.021337 # +# berkeley_autolab_ur5: ====================================================0.027379 # +# austin_buds_dataset_converted_externally_to_rlds: ========================0.004768 # +# nyu_franka_play_dataset_converted_externally_to_rlds: ====================0.018817 # +# furniture_bench_dataset_converted_externally_to_rlds: ====================0.055185 # +# austin_sailor_dataset_converted_externally_to_rlds: ======================0.049354 # +# austin_sirius_dataset_converted_externally_to_rlds: ======================0.039129 # +# dlr_edan_shared_control_converted_externally_to_rlds: ====================0.001248 # +# utaustin_mutex: ==========================================================0.050583 # +# berkeley_fanuc_manipulation: =============================================0.017504 # +# bc_z: ====================================================================0.168166 # +# roboturk: ================================================================0.000131 # +# toto: ====================================================================0.000228 # +# ucsd_kitchen_dataset_converted_externally_to_rlds: =======================0.000006 # +# iamlab_cmu_pickup_insert_converted_externally_to_rlds: ===================0.000102 # +###################################################################################### + +10/08 [16:42:06] INFO | >> [*] Threads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:563 + INFO | >> [*] Reads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:564 + INFO | >> [*] Constructing datasets... dataset.py:567 +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +10/08 [16:42:11] INFO | >> [*] Applying frame transforms on dataset... dataset.py:607 +****** after RLDSDataset initialization! +****** length of the dataset: 7154275 +****** Build rlds train dataset: IterableDatasetWrapper successfully. +****** path: None +****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None +****** After build vla train dataset... +****** iterable_sources: [, ] +****** Before build mixed iterable dataset... +****** Build vla train dataloader successfully! +************************* Build train_dataloader successful! +************************* Before build_inf_evaluators + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +************************* Build evaluators successful! +************************* Early exit flags: early_exit=False +PROPRIO_DIM 16 does not match ACTION_DIM 16 for AffordVLA +************************* Initialize model successful! +***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt +***** Load checkpoint successful! +missing keys: ['action_head.model.layer_norm1.weight', 'action_head.model.layer_norm1.bias', 'action_head.model.fc1.weight', 'action_head.model.fc1.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.1.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.1.bias', 'action_head.model.layer_norm2.weight', 'action_head.model.layer_norm2.bias', 'action_head.model.fc2.weight', 'action_head.model.fc2.bias', 'proprio_projector.fc1.weight', 'proprio_projector.fc1.bias', 'proprio_projector.fc2.weight', 'proprio_projector.fc2.bias'] +unexpected keys: [] +************************* Initialize model successful! +************************* Before FSDP model wrapping +************************* FSDP model wrapping successful! +************************* Before building optimizer and scheduler +10/08 [16:43:46] INFO | >> Constructing optimizer with 2 param groups optim.py:1283 +************************************************** +After building optimizer and scheduler and model, before training, peak GPU memory (MB): 35614 +************************* VLATrainer initialized successfully! +************************* Before trainer.fit() +Pre-train system metrics + System/Peak GPU Memory (MB)=35,614 +10/08 [16:43:56] WARNING | >> /vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py:200: UserWarning: To copy construct from a tensor, it is recommended to use warnings.py:109 + sourceTensor.detach().clone() or sourceTensor.detach().clone().requires_grad_(True), rather than torch.tensor(sourceTensor). + timestep_list = [torch.tensor(ex["timestep"], dtype=torch.int64) for ex in batch] + +!!!Training failed: stack expects each tensor to be equal size, but got [] at entry 0 and [1] at entry 1 +Traceback (most recent call last): + File "/vast/users/xiaodan/zhangjian/A1/scripts/train_for_action.py", line 593, in main + trainer.fit() + File "/vast/users/xiaodan/zhangjian/A1/olmo/train.py", line 2284, in fit + for batch in self.train_loader: + File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 734, in __next__ + data = self._next_data() + File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/dataloader.py", line 790, in _next_data + data = self._dataset_fetcher.fetch(index) # may raise StopIteration + File "/vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/utils/data/_utils/fetch.py", line 43, in fetch + return self.collate_fn(data) + File "/vast/users/xiaodan/zhangjian/A1/olmo/data/collator.py", line 201, in __call__ + out['timestep'] = torch.stack(timestep_list, dim=0) +RuntimeError: stack expects each tensor to be equal size, but got [] at entry 0 and [1] at entry 1 +wandb: WARNING The `quiet` argument to `wandb.run.finish()` is deprecated, use `wandb.Settings(quiet=...)` to set this instead. diff --git a/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/requirements.txt b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/requirements.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8 --- /dev/null +++ b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/requirements.txt @@ -0,0 +1,286 @@ +ai2-molmo==0.0.0 +astunparse==1.6.3 +flatbuffers==25.2.10 +gast==0.6.0 +google-pasta==0.2.0 +h5py==3.14.0 +libclang==18.1.1 +Markdown==3.9 +namex==0.1.0 +opt_einsum==3.4.0 +optree==0.17.0 +tensorboard-data-server==0.7.2 +tensorflow-io-gcs-filesystem==0.37.1 +termcolor==3.1.0 +Werkzeug==3.1.3 +Brotli==1.1.0 +Farama-Notifications==0.0.4 +MarkupSafe==2.1.5 +PyYAML==6.0.2 +absl-py==2.3.1 +accelerate==1.10.1 +ai2-molmo==0.0.0 +aiofiles==24.1.0 +aiohappyeyeballs==2.6.1 +aiohttp==3.12.15 +aiosignal==1.4.0 +annotated-types==0.7.0 +antlr4-python3-runtime==4.9.3 +anyio==4.10.0 +array_record==0.8.1 +async-timeout==5.0.1 +attrs==25.3.0 +av==15.1.0 +backports.tarfile==1.2.0 +beaker-gantry==3.2.0 +beaker-py==2.5.0 +black==23.12.1 +blinker==1.9.0 +boltons==25.0.0 +boto3==1.40.33 +botocore==1.40.33 +build==1.3.0 +cached_path==1.7.3 +cached-property==2.0.1 +cachetools==5.5.2 +certifi==2025.8.3 +cffi==2.0.0 +charset-normalizer==3.4.3 +click==8.2.1 +click-help-colors==0.9.4 +click-option-group==0.5.7 +cloudpickle==3.1.1 +cmake==4.1.0 +contourpy==1.3.2 +cryptography==46.0.1 +cycler==0.12.1 +dataclass-extensions==0.2.3 +datasets==3.6.0 +decorator==5.2.1 +deepdiff==8.6.1 +diffusers==0.35.1 +dill==0.3.8 +distro==1.9.0 +dlimp==0.0.1 +dm-tree==0.1.9 +docutils==0.22.1 +draccus==0.10.0 +editdistance==0.8.1 +einops==0.8.1 +einops-exts==0.0.4 +et_xmlfile==2.0.0 +etils==1.13.0 +evdev==1.9.2 +exceptiongroup==1.3.0 +face==24.0.0 +fastapi==0.116.2 +ffmpy==0.6.1 +fiddle==0.3.0 +filelock==3.13.1 +Flask==3.1.2 +fonttools==4.60.0 +frozenlist==1.7.0 +fsspec==2023.9.2 +ftfy==6.3.1 +gcsfs==2023.9.2 +gitdb==4.0.12 +GitPython==3.1.45 +glom==24.11.0 +google-api-core==2.25.1 +google-auth==2.40.3 +google-auth-oauthlib==1.2.2 +google-cloud-core==2.4.3 +google-cloud-storage==2.19.0 +google-crc32c==1.7.1 +google-resumable-media==2.7.2 +googleapis-common-protos==1.70.0 +gradio==5.46.0 +gradio_client==1.13.0 +graphviz==0.21 +groovy==0.1.2 +grpcio==1.75.0 +gymnasium==0.29.1 +h11==0.16.0 +hf_transfer==0.1.9 +hf-xet==1.1.10 +httpcore==1.0.9 +httpx==0.28.1 +huggingface-hub==0.35.0 +id==1.5.0 +idna==3.10 +imageio==2.37.0 +imageio-ffmpeg==0.6.0 +importlib_metadata==8.7.0 +importlib_resources==6.5.2 +iniconfig==2.1.0 +inquirerpy==0.3.4 +isort==5.12.0 +itsdangerous==2.2.0 +jaraco.classes==3.4.0 +jaraco.context==6.0.1 +jaraco.functools==4.3.0 +jeepney==0.9.0 +Jinja2==3.1.4 +jiter==0.11.0 +jmespath==1.0.1 +joblib==1.5.2 +jsonlines==4.0.0 +keras==2.15.0 +keyring==25.6.0 +kiwisolver==1.4.9 +latex2sympy2_extended==1.10.2 +lerobot==0.3.4 +Levenshtein==0.27.1 +libcst==1.8.4 +lightning-utilities==0.15.2 +markdown-it-py==4.0.0 +math-verify==0.8.0 +matplotlib==3.10.6 +mdurl==0.1.2 +mergedeep==1.3.4 +ml-dtypes==0.2.0 +ml_dtypes==0.5.3 +more-itertools==10.8.0 +mpmath==1.3.0 +msgspec==0.19.0 +multidict==6.6.4 +multiprocess==0.70.16 +mypy==1.3.0 +mypy_extensions==1.1.0 +necessary==0.4.3 +networkx==3.3 +nh3==0.3.0 +nltk==3.9.1 +numpy==1.26.4 +oauthlib==3.3.1 +omegaconf==2.3.0 +openai==1.108.0 +opencv-python-headless==4.12.0.88 +OpenEXR==3.4.0 +openpyxl==3.1.5 +orderly-set==5.5.0 +orjson==3.11.3 +packaging==25.0 +pandas==2.3.2 +pathspec==0.12.1 +petname==2.6 +pfzy==0.3.4 +pillow==11.0.0 +pip==25.2 +platformdirs==4.4.0 +pluggy==1.6.0 +promise==2.3 +prompt_toolkit==3.0.52 +propcache==0.3.2 +proto-plus==1.26.1 +protobuf==4.21.12 +protobuf==6.32.1 +psutil==7.1.0 +pyarrow==21.0.0 +pyasn1==0.6.1 +pyasn1_modules==0.4.2 +pycparser==2.23 +pydantic==2.11.9 +pydantic_core==2.33.2 +pydub==0.25.1 +Pygments==2.19.2 +pynput==1.8.1 +pyparsing==3.2.4 +pyproject_hooks==1.2.0 +pyserial==3.5 +pytest==8.4.2 +pytest-sphinx==0.6.3 +python-dateutil==2.9.0.post0 +python-Levenshtein==0.27.1 +python-multipart==0.0.20 +python-xlib==0.33 +pytorch-triton-rocm==3.4.0 +pytz==2025.2 +pyyaml-include==1.4.1 +RapidFuzz==3.14.1 +readme_renderer==44.0 +regex==2025.9.1 +requests==2.32.5 +requests-oauthlib==2.0.0 +requests-toolbelt==1.0.0 +requirements-parser==0.13.0 +rerun-sdk==0.22.1 +rfc3986==2.0.0 +rich==13.9.4 +rsa==4.9.1 +ruff==0.13.0 +s3transfer==0.14.0 +safehttpx==0.1.6 +safetensors==0.6.2 +scikit-learn==1.7.2 +scipy==1.15.3 +SecretStorage==3.4.0 +semantic-version==2.10.0 +sentencepiece==0.2.1 +sentry-sdk==2.38.0 +setuptools==78.1.1 +shellingham==1.5.4 +six==1.17.0 +smart_open==7.3.1 +smashed==0.21.5 +smmap==5.0.2 +sniffio==1.3.1 +starlette==0.48.0 +sympy==1.13.3 +tensorboard==2.15.2 +tensorboard==2.19.0 +tensorflow==2.15.0 +tensorflow-addons==0.23.0 +tensorflow-datasets==4.9.3 +tensorflow-estimator==2.15.0 +tensorflow-graphics==2021.12.3 +tensorflow-metadata==1.17.2 +threadpoolctl==3.6.0 +timm==1.0.19 +tokenizers==0.22.0 +toml==0.10.2 +tomli==2.2.1 +tomlkit==0.13.3 +torch==2.8.0+rocm6.4 +torchcodec==0.5 +torchmetrics==1.8.2 +torchvision==0.23.0+rocm6.4 +tqdm==4.67.1 +transformers==4.56.1 +trimesh==4.8.2 +trouting==0.3.3 +twine==6.2.0 +typeguard==2.13.3 +typer==0.17.4 +typing_extensions==4.15.0 +typing-inspect==0.9.0 +typing-inspection==0.4.1 +tzdata==2025.2 +urllib3==2.5.0 +uvicorn==0.35.0 +wandb==0.21.4 +wcwidth==0.2.13 +websockets==15.0.1 +wheel==0.45.1 +wrapt==1.14.2 +xxhash==3.5.0 +yarl==1.20.1 +zipp==3.23.0 +lerobot==0.3.4 +minLoRA==0.1.0 +autocommand==2.2.2 +backports.tarfile==1.2.0 +importlib_metadata==8.0.0 +inflect==7.3.1 +jaraco.collections==5.1.0 +jaraco.context==5.3.0 +jaraco.functools==4.0.1 +jaraco.text==3.12.1 +more-itertools==10.3.0 +packaging==24.2 +platformdirs==4.2.2 +tomli==2.0.1 +typeguard==4.3.0 +typing_extensions==4.12.2 +wheel==0.45.1 +zipp==3.19.2 diff --git a/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/wandb-metadata.json b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/wandb-metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..9140a43346a93ec6c5022eb91109b87809f6028b --- /dev/null +++ b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/wandb-metadata.json @@ -0,0 +1,204 @@ +{ + "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35", + "python": "CPython 3.10.18", + "startedAt": "2025-10-08T16:38:31.938958Z", + "args": [ + "qwen2_7b", + "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk_l1_regression", + "--vision_backbone", + "openai", + "--action_head", + "l1_regression", + "--seq_len", + "1600", + "--ft_llm", + "--checkpoint", + "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924", + "--device_train_microbatch_size", + "16", + "--global_batch_size", + "126", + "--dataset", + "vla_dataset_realworld", + "--llm_learning_rate", + "5e-5", + "--wandb_entity", + "henryeap", + "--wandb_project", + "a1-realworld", + "--wandb_run_name", + "cleandesk", + "--real_world_vla_config_path", + "vla_config_realworld/vla_config_cleandesk.yaml", + "--save_overwrite" + ], + "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py", + "codePath": "launch_scripts/train_vla.py", + "codePathLocal": "launch_scripts/train_vla.py", + "git": { + "remote": "https://github.com/Spatialtemporal-AI/A1.git", + "commit": "49712a42d21a8c739a16ba5eeaec4a0d7b29ab80" + }, + "email": "ihenrykwok@outlook.com", + "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/cleandesk_l1_regression/wandb", + "host": "auh7-1b-gpu-316", + "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10", + "cpu_count": 64, + "cpu_count_logical": 128, + "gpu": "Instinct MI210", + "gpu_count": 8, + "disk": { + "/": { + "total": "470343073792", + "used": "50668195840" + } + }, + "memory": { + "total": "2434606952448" + }, + "gpu_amd": [ + { + "id": "3", + "uniqueId": "0x62b25d667064a7ff", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "6", + "uniqueId": "0xbdb93fac1aa97618", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "7", + "uniqueId": "0x850c5a1ff5d005be", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "2", + "uniqueId": "0x7a3e2781f4182456", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "4", + "uniqueId": "0x4c21a2ad76408df6", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "0", + "uniqueId": "0xa8d2c33980704bf2", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "1", + "uniqueId": "0xd13265721a117b54", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "5", + "uniqueId": "0x19ee82506963794b", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + } + ], + "slurm": { + "cluster_name": "ai-04r", + "conf": "/etc/slurm/slurm.conf", + "cpus_on_node": "128", + "gpus_on_node": "8", + "gtids": "0", + "job_account": "faculty-acc", + "job_cpus_per_node": "128", + "job_end_time": "1760200645", + "job_gid": "2000", + "job_gpus": "0,1,2,3,4,5,6,7", + "job_id": "2282", + "job_name": "mh_cleandesk_l1_regression", + "job_nodelist": "auh7-1b-gpu-316", + "job_num_nodes": "1", + "job_partition": "faculty", + "job_qos": "xdqos", + "job_start_time": "1759941445", + "job_uid": "2013", + "job_user": "xiaodan", + "jobid": "2282", + "localid": "0", + "nnodes": "1", + "nodeid": "0", + "nodelist": "auh7-1b-gpu-316", + "nprocs": "1", + "ntasks": "1", + "ntasks_per_node": "1", + "oom_kill_step": "0", + "prio_process": "0", + "procid": "0", + "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts", + "submit_host": "auh-1b-cpu-login-001", + "task_pid": "1925818", + "tasks_per_node": "1", + "topology_addr": "auh7-1b-gpu-316", + "topology_addr_pattern": "node" + }, + "writerId": "9zghejqbkg668a368vduhoyzhbv4wgq6" +} \ No newline at end of file diff --git a/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/wandb-summary.json b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/wandb-summary.json new file mode 100644 index 0000000000000000000000000000000000000000..69b102977bc590ee6a0c3e2b05c8ab9c83e0d62f --- /dev/null +++ b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/files/wandb-summary.json @@ -0,0 +1 @@ +{"_step":0,"System/Peak GPU Memory (MB)":35614.78125,"_timestamp":1.7599418260827e+09,"_wandb":{"runtime":325},"_runtime":325.049768384} \ No newline at end of file diff --git a/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/logs/debug-core.log b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/logs/debug-core.log new file mode 100644 index 0000000000000000000000000000000000000000..b567c8ed97dfdc071643e8ab5622283163027bdf --- /dev/null +++ b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/logs/debug-core.log @@ -0,0 +1,16 @@ +{"time":"2025-10-08T16:38:32.182353704Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpl72x4viw/port-1926008.txt","pid":1926008,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false} +{"time":"2025-10-08T16:38:32.183512473Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":1926008} +{"time":"2025-10-08T16:38:32.184652392Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-1926008-1926185-2566029014/socket","Net":"unix"}} +{"time":"2025-10-08T16:38:32.187758092Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"} +{"time":"2025-10-08T16:38:32.198021978Z","level":"INFO","msg":"handleInformInit: received","streamId":"76mxu43t","id":"1(@)"} +{"time":"2025-10-08T16:38:33.339879992Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"76mxu43t","id":"1(@)"} +{"time":"2025-10-08T16:44:00.126902419Z","level":"INFO","msg":"handleInformFinish: finish message received","streamId":"76mxu43t","id":"1(@)"} +{"time":"2025-10-08T16:44:00.130282224Z","level":"INFO","msg":"handleInformFinish: stream closed","streamId":"76mxu43t","id":"1(@)"} +{"time":"2025-10-08T16:44:00.192589494Z","level":"INFO","msg":"handleInformTeardown: server teardown initiated","id":"1(@)"} +{"time":"2025-10-08T16:44:00.192627935Z","level":"INFO","msg":"handleInformTeardown: server shutdown complete","id":"1(@)"} +{"time":"2025-10-08T16:44:00.192634215Z","level":"INFO","msg":"server is shutting down"} +{"time":"2025-10-08T16:44:00.192643625Z","level":"INFO","msg":"connection: closing","id":"1(@)"} +{"time":"2025-10-08T16:44:00.192695596Z","level":"INFO","msg":"connection: closed successfully","id":"1(@)"} +{"time":"2025-10-08T16:44:00.192701166Z","level":"INFO","msg":"connection: ManageConnectionData: connection closed","id":"1(@)"} +{"time":"2025-10-08T16:44:00.192695596Z","level":"INFO","msg":"server: listener closed","addr":{"Name":"/tmp/wandb-1926008-1926185-2566029014/socket","Net":"unix"}} +{"time":"2025-10-08T16:44:00.192730717Z","level":"INFO","msg":"server is closed"} diff --git a/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/logs/debug-internal.log b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/logs/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..46affc2ba51fb5f59733037d81f939926d62e073 --- /dev/null +++ b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/logs/debug-internal.log @@ -0,0 +1,12 @@ +{"time":"2025-10-08T16:38:32.19998745Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-08T16:38:33.339827981Z","level":"INFO","msg":"stream: created new stream","id":"76mxu43t"} +{"time":"2025-10-08T16:38:33.339874102Z","level":"INFO","msg":"stream: started","id":"76mxu43t"} +{"time":"2025-10-08T16:38:33.339905492Z","level":"INFO","msg":"handler: started","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:38:33.339893552Z","level":"INFO","msg":"writer: started","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:38:33.339947873Z","level":"INFO","msg":"sender: started","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:43:58.756754711Z","level":"INFO","msg":"handler: operation stats","stats":{"operations":[{"desc":"updating run metadata","runtime_seconds":0.006574606}],"total_operations":1}} +{"time":"2025-10-08T16:43:59.766243448Z","level":"INFO","msg":"fileTransfer: Close: file transfer manager closed"} +{"time":"2025-10-08T16:44:00.127335826Z","level":"INFO","msg":"stream: closing","id":"76mxu43t"} +{"time":"2025-10-08T16:44:00.127349836Z","level":"INFO","msg":"handler: closed","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:44:00.128408003Z","level":"INFO","msg":"sender: closed","stream_id":"76mxu43t"} +{"time":"2025-10-08T16:44:00.128424754Z","level":"INFO","msg":"stream: closed","id":"76mxu43t"} diff --git a/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/logs/debug.log b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/logs/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/run-76mxu43t.wandb b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/run-76mxu43t.wandb new file mode 100644 index 0000000000000000000000000000000000000000..49d39f7008e1971826bac0323d4ccea4f0cf035a --- /dev/null +++ b/cleandesk_l1_regression/wandb/wandb/run-20251008_163831-76mxu43t/run-76mxu43t.wandb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:592c2180c1f58861cad10bcce3042c15f3fa428cb470d5da0ac15865d108e860 +size 205758 diff --git a/eraser_flow_matching/step11500-action-head/metadata.pt b/eraser_flow_matching/step11500-action-head/metadata.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e34304d65d6217c2b0a33ee0a75ccecc5e8f82c --- /dev/null +++ b/eraser_flow_matching/step11500-action-head/metadata.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb72b6306ce04d1beb20bb289509f00c39a40845ff7c4b36bf4deb4e83fe82a +size 1331 diff --git a/eraser_flow_matching/step12000-action-head/metadata.pt b/eraser_flow_matching/step12000-action-head/metadata.pt new file mode 100644 index 0000000000000000000000000000000000000000..752c8b547c4cac7f78746ac5066032167b1cf3c1 --- /dev/null +++ b/eraser_flow_matching/step12000-action-head/metadata.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995307502120af3866f237cd0bc484fc848a652539d28e53cbea882abc16ba6b +size 1331 diff --git a/eraser_flow_matching/step12000-unsharded/config.yaml b/eraser_flow_matching/step12000-unsharded/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..bcdc1e14f2d420fe1d72bf11ddd06055bee54a43 --- /dev/null +++ b/eraser_flow_matching/step12000-unsharded/config.yaml @@ -0,0 +1,322 @@ +run_name: eraser_20251011_163756 +seed: 6198 +epoch: null +dry_run: false +model: + d_model: 3584 + n_heads: 28 + n_kv_heads: 4 + qkv_bias: true + clip_qkv: null + n_layers: 28 + mlp_ratio: 4 + mlp_hidden_size: 37888 + activation_type: swiglu + block_type: sequential + block_group_size: 1 + rope: true + rope_full_precision: true + rope_theta: 1000000.0 + vision_backbone: + image_model_type: openai + image_default_input_size: + - 336 + - 336 + image_patch_size: 14 + image_pos_patch_size: 14 + image_emb_dim: 1024 + image_num_heads: 16 + image_num_key_value_heads: 16 + image_num_layers: 23 + image_head_dim: 64 + image_mlp_dim: 4096 + image_mlp_activations: quick_gelu + image_dropout_rate: 0.0 + image_num_pos: 577 + image_norm_eps: 1.0e-05 + attention_dropout: 0.0 + residual_dropout: 0.0 + initializer_range: 0.02 + fsdp_wrap: false + resize_mode: default + vit_load_path: /weka/oe-training-default/mm-olmo/pretrained_image_encoders/vit-l-14-336.pt + llm_load_path: /weka/oe-training-default/mm-olmo/pretrained_llms/qwen2-7b.pt + low_cpu_fsdp: true + attention_type: sdpa + float32_attention: true + attention_dropout: 0.0 + attention_layer_norm: false + residual_dropout: 0.1 + response_residual_dropout: 0.0 + embedding_dropout: 0.0 + layer_norm_type: rms + layer_norm_with_affine: true + layer_norm_eps: 1.0e-06 + attention_layer_norm_with_affine: true + max_sequence_length: 4096 + max_position_embeddings: null + include_bias: false + bias_for_layer_norm: null + scale_logits: false + vocab_size: 152064 + embedding_size: 152064 + ff_out_size: null + additional_vocab_size: 128 + new_embedding_init_range: 0.02 + weight_tying: false + init_device: null + init_fn: normal + init_std: 0.02 + init_cutoff_factor: null + norm_after: false + precision: amp_bf16 + max_crops: 12 + crop_mode: overlap-and-resize-c2 + use_col_tokens: true + prompt_type: uber_model + system_prompt_kind: demo_or_style + message_formatting: role + always_start_with_space: true + multi_annotation_weighting: root_subsegments + default_inference_len: 65 + overlap_margins: + - 4 + - 4 + pad_value: 0.0 + image_padding_embed: pad_and_partial_pad + fix_image_padding: true + vit_layers: + - -2 + - -9 + image_pooling_h: 2 + image_pooling_w: 2 + image_pooling_2d: attention_meanq + image_projector: mlp + image_feature_dropout: 0.0 + initializer_range: 0.02 + normalize_input_embeds: false + use_position_ids: true + head_dim: null + action_tokenizer: + identifier: physical-intelligence/fast + tokenizer_dir: null + action_dim: 7 + horizon: 8 + tokenizer: + identifier: Qwen/Qwen2-7B + tokenizer_dir: null + pad_tokenizer: true + moe_num_experts: 8 + moe_top_k: 2 + moe_mlp_impl: sparse + moe_log_expert_assignment: false + moe_shared_expert: false + moe_lbl_in_fp32: false + moe_interleave: false + moe_loss_weight: 0.1 + moe_zloss_weight: null + moe_dropless: true + moe_capacity_factor: 1.25 + action_head: flow_matching + num_diffusion_steps: 1000 + num_diffusion_inference_steps: 30 + use_proprio: true + action_head_dit_hidden_size: 1152 + action_head_dit_depth: 28 + action_head_dit_num_heads: 16 + llm_causal_attention: false + action_use_left_eef: true + action_use_mobile_base: false +allow_resume: false +ft_llm: true +ft_vit: false +ft_connector: false +ft_embedding: lm_head +lora: false +use_lora: false +lora_rank: 8 +lora_llm: false +lora_vit: false +lora_connector: false +early_exit: false +train_exit_random_layer: false +optimizer: + name: adamw + learning_rate: 0.0001 + weight_decay: 0.01 + betas: + - 0.9 + - 0.95 + eps: 1.0e-05 + connector_learning_rate: 0.0002 + vit_learning_rate: 6.0e-06 + llm_learning_rate: 5.0e-05 + connector_weight_decay: 0.0 + vit_weight_decay: 0.0 + llm_weight_decay: 0.0 + connector_betas: + - 0.9 + - 0.95 + vit_betas: + - 0.9 + - 0.95 + llm_betas: + - 0.9 + - 0.95 + connector_eps: 1.0e-06 + vit_eps: 1.0e-06 + llm_eps: 1.0e-06 + metrics_log_interval: 20 +scheduler: + name: multimodal + units: steps + t_warmup: 100 + t_max: null + alpha_f: 0.1 + connector_t_warmup: 200 + vit_t_warmup: 2000 + llm_t_warmup: 2000 + grad_clip_warmup_steps: null + grad_clip_warmup_factor: null + warmup_min_lr: 0.0 +data: + dataset: vla_dataset_realworld + mixture: null + root_size_mixture: null + split: train + seed: 95818 + shuffle_messages: false + pad: to_max + sequence_length: 1600 + shuffle: true + for_inference: false + multi_modal: torch + num_workers: 0 + drop_last: true + pin_memory: true + prefetch_factor: null + persistent_workers: false + timeout: 0 + rlds_dataset_name: a1_real_world + rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE + use_wrist_image: true + use_proprio: true + rlds_shuffle_buffer_size: 100000 + rlds_traj_threads: 8 + rlds_read_threads: 8 + lerobot_episode_index_start: null + lerobot_episode_index_end: null +restore_dataloader: true +fast_forward_batches: null +evaluators: +- label: val + data: + dataset: vla_dataset_realworld + mixture: null + root_size_mixture: null + split: validation + seed: null + shuffle_messages: false + pad: to_max + sequence_length: 1600 + shuffle: false + for_inference: false + multi_modal: torch + num_workers: 0 + drop_last: true + pin_memory: true + prefetch_factor: null + persistent_workers: true + timeout: 0 + rlds_dataset_name: libero_4_task_suites_no_noops + rlds_data_root_dir: /mnt/data/zhangjian/dataset/Simulation/datasets--openvla--modified_libero_rlds + use_wrist_image: true + use_proprio: true + rlds_shuffle_buffer_size: 256000 + rlds_traj_threads: 8 + rlds_read_threads: 8 + lerobot_episode_index_start: 353 + lerobot_episode_index_end: 765 + device_eval_batch_size: null + subset_num_batches: 64 + max_examples: null + max_new_tokens: 448 + mm_evaluator: null + save_dir: null + save_to_checkpoint_dir: false + eval_name: null + skip_if_metrics_cached: true +eval_interval: 0 +inf_eval_interval: -1 +inf_evaluators: [] +save_folder: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/eraser_flow_matching +remote_save_folder: null +canceled_check_interval: 50 +save_interval: 500 +save_interval_unsharded: 500 +save_interval_ephemeral: null +save_interval_action_head: 500 +save_num_checkpoints_to_keep: 1 +save_num_unsharded_checkpoints_to_keep: 1 +save_num_action_head_checkpoints_to_keep: 2 +save_overwrite: true +force_save_unsharded: false +no_pre_train_checkpoint: true +initial_model_checkpoint: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +load_model_config: null +checkpoint_dir: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924 +load_path: null +load_path_sharded_checkpointer: null +reset_optimizer_state: false +reset_trainer_state: false +save_dataloader_state: false +reset_dataloader_state: false +keep_lr_on_load: true +sharded_checkpointer: torch_legacy +max_duration: 500000 +global_train_batch_size: 126 +device_train_batch_size: 15 +device_train_microbatch_size: 16 +device_eval_batch_size: 4 +eval_subset_num_batches: -1 +eval_on_load: false +device_inf_eval_batch_size: 16 +inf_eval_subset_num_batches: -1 +device_train_grad_accum: 0 +max_grad_norm: 1.0 +multi_component_grad_norm: true +batch_divisor: global_batch +max_grad_norm_ratio: null +precision: amp_bf16 +wandb: + project: a1-realworld + entity: henryeap + group: null + name: eraser_20251011_163756 + tags: + - watching + log_artifacts: false + rank_zero_only: true + log_interval: 1 +speed_monitor: + window_size: 20 + gpu_flops_available: null +console_log_interval: 1 +gen1_gc_interval: 1 +compile: null +fsdp: + use_orig_params: true + sharding_strategy: FULL_SHARD + wrapping_strategy: by_block_and_size + precision: float + hybrid_sharding_num_model_replicas: null +softmax_auxiliary_loss: true +softmax_auxiliary_loss_scale: 0.0001 +time_limit: null +extra_steps_after_cancel: 10 +python_profiling: false +torch_profiling: false +stop_at: 500000 +stop_after: null +activation_checkpointing: whole_layer +fused_loss: null diff --git a/eraser_flow_matching/step12000-unsharded/train.pt b/eraser_flow_matching/step12000-unsharded/train.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eb1983d5bcb82b04ff09881957f3a2e876fad16 --- /dev/null +++ b/eraser_flow_matching/step12000-unsharded/train.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27b7944a86ee4e879d03cec156d2128c480602778b651762977174d39e5f94ab +size 15061 diff --git a/eraser_flow_matching/wandb/wandb/debug-internal.log b/eraser_flow_matching/wandb/wandb/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..eb290784ac6ab6aaf91849ad696f7d4596c50668 --- /dev/null +++ b/eraser_flow_matching/wandb/wandb/debug-internal.log @@ -0,0 +1,8 @@ +{"time":"2025-10-11T16:38:32.587302182Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-11T16:38:33.732885593Z","level":"INFO","msg":"stream: created new stream","id":"yqnt28c8"} +{"time":"2025-10-11T16:38:33.732932354Z","level":"INFO","msg":"stream: started","id":"yqnt28c8"} +{"time":"2025-10-11T16:38:33.732959824Z","level":"INFO","msg":"writer: started","stream_id":"yqnt28c8"} +{"time":"2025-10-11T16:38:33.732985135Z","level":"INFO","msg":"handler: started","stream_id":"yqnt28c8"} +{"time":"2025-10-11T16:38:33.732961384Z","level":"INFO","msg":"sender: started","stream_id":"yqnt28c8"} +{"time":"2025-10-13T08:15:22.219814038Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-13T20:01:35.03758236Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"} diff --git a/eraser_flow_matching/wandb/wandb/debug.log b/eraser_flow_matching/wandb/wandb/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/files/output.log b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/files/output.log new file mode 100644 index 0000000000000000000000000000000000000000..40164e22b0cc4306246cd35ae508168e96feb936 --- /dev/null +++ b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/files/output.log @@ -0,0 +1,62401 @@ +wandb: Detected [openai] in use. +wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script. +wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/ +10/11 [16:38:34] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Eraser', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}} +****** Skip RLDS main; path not found: None +****** start build LeRobot main... +build_tokenizer, cache_dir None tokenizer_dir None +10/11 [16:38:36] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130 + INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:438 +****** before LeRobot dataset... +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Eraser +camera_keys: ['image', 'hand_left_image', 'hand_right_image'], state_key: state, action_key: actions +****** length of the dataset: 13441 +10/11 [16:38:38] INFO | >> build_rlds_train_dataset: Loading train dataset: vla_dataset_realworld/train __init__.py:521 +****** Import RLDSBatchTransform, RLDSDataset successfully. +****** before RLDS dataset... +****** data_config.rlds_dataset_name: a1_real_world +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE +214************** +10/11 [16:38:39] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/fractal20220817_data/0.1.0/dataset_statistics_138513de447c9e5435c5a12cc1c4a3c6a6434524fbd28f4 + 5463261fac12cf3fb.json. +214************** +10/11 [16:38:40] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/jaco_play/0.1.0/dataset_statistics_e081d4716a3da95df91c79d661ae59fa26a43da49db4bf8d716b622b56 + 3b0ea3.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_cable_routing/0.1.0/dataset_statistics_08cb4c5b7c5e6c035fc84ea85b2d54c0c46ad608a8763 + 4ebb18374088d23cd76.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/viola/0.1.0/dataset_statistics_2415d8f7de73c8761fedd7c2a9590667fb0d3fdd26664bf4c100222e5cdb89 + b9.json. +214************** +10/11 [16:38:41] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_autolab_ur5/0.1.0/dataset_statistics_1b798b015e7b2c4e4396719e3aa4d43a2f400b2edf5dbb0 + 820cb3df6943d8ddc.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_buds_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_ccecde24cc01793b221 + 4eb0c4c5d7cc0e3ccc623db99bd892b83552b20decfb7.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/nyu_franka_play_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_b0d79557eac3059 + ebf9f679a8f044bd60403f0cba16a37e0df2fe1654416ffe7.json. +214************** +10/11 [16:38:42] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/furniture_bench_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_76735bab3752978 + bef83e1341d3c8db0a0d5a10397247eb3e0459388dccfe698.json. +214************** +10/11 [16:38:43] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_sailor_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_4127c515a9413766f + e40ac696d884550bc655a40952ef3ae457c404d31570123.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_sirius_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_cb2e0273f80029a19 + dc3dbb3a3a4118a5598e7bff3ff0245891255825b04b42a.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/dlr_edan_shared_control_converted_externally_to_rlds/0.1.0/dataset_statistics_b8984563fc3e7ea + c0803c667ef58c9deaf2e747683568306ea1d83505d532a76.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/utaustin_mutex/0.1.0/dataset_statistics_0a99ee5a8ce4a34ba018a7c0c742a1b74ab7abb7d7a3925f8596a + 3fc4eb8efc7.json. +214************** +10/11 [16:38:44] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_fanuc_manipulation/0.1.0/dataset_statistics_a98d349d0364668095ea3ca38c6785e94f35e5e5 + 8e234c88fac83775a923b0d0.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/bc_z/0.1.0/dataset_statistics_8187209d5cb273687cc8666697219dae50914ae2bee7f03552bd85a91fcfe7a + 4.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/roboturk/0.1.0/dataset_statistics_3aa821e17a2937f941d4102cfadcb1154853cb45dcec07ccc66893b01f6 + f1b40.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/toto/0.1.0/dataset_statistics_505a51eb76e85fe0969e8e70e45fb8c9ae5d3b1fae2851c7899bea91f74b979 + 0.json. +214************** +10/11 [16:38:45] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/ucsd_kitchen_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_1f1a5f310a2d5a6edc + 0e217370e135c8c8598290f11f57025037adcb0d033926.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/iamlab_cmu_pickup_insert_converted_externally_to_rlds/0.1.0/dataset_statistics_698a1f892f8866 + af9cb4bd5a23611fa44d8c7d9d816f9b3049d2fc3b62442079.json. + +###################################################################################### +# Loading the following 18 datasets (incl. sampling weight): # +# fractal20220817_data: ====================================================0.529250 # +# jaco_play: ===============================================================0.010898 # +# berkeley_cable_routing: ==================================================0.005916 # +# viola: ===================================================================0.021337 # +# berkeley_autolab_ur5: ====================================================0.027379 # +# austin_buds_dataset_converted_externally_to_rlds: ========================0.004768 # +# nyu_franka_play_dataset_converted_externally_to_rlds: ====================0.018817 # +# furniture_bench_dataset_converted_externally_to_rlds: ====================0.055185 # +# austin_sailor_dataset_converted_externally_to_rlds: ======================0.049354 # +# austin_sirius_dataset_converted_externally_to_rlds: ======================0.039129 # +# dlr_edan_shared_control_converted_externally_to_rlds: ====================0.001248 # +# utaustin_mutex: ==========================================================0.050583 # +# berkeley_fanuc_manipulation: =============================================0.017504 # +# bc_z: ====================================================================0.168166 # +# roboturk: ================================================================0.000131 # +# toto: ====================================================================0.000228 # +# ucsd_kitchen_dataset_converted_externally_to_rlds: =======================0.000006 # +# iamlab_cmu_pickup_insert_converted_externally_to_rlds: ===================0.000102 # +###################################################################################### + + INFO | >> [*] Threads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:563 + INFO | >> [*] Reads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:564 + INFO | >> [*] Constructing datasets... dataset.py:567 +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +10/11 [16:38:50] INFO | >> [*] Applying frame transforms on dataset... dataset.py:607 +****** after RLDSDataset initialization! +****** length of the dataset: 7154275 +****** Build rlds train dataset: IterableDatasetWrapper successfully. +****** path: None +****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None +****** After build vla train dataset... +****** iterable_sources: [, ] +****** Before build mixed iterable dataset... +****** Build vla train dataloader successfully! +************************* Build train_dataloader successful! +************************* Before build_inf_evaluators + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +************************* Build evaluators successful! +************************* Early exit flags: early_exit=False +PROPRIO_DIM 16 does not match ACTION_DIM 16 for AffordVLA +************************* Initialize model successful! +***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt +***** Load checkpoint successful! +missing keys: ['action_head.state_proj.weight', 'action_head.state_proj.bias', 'action_head.action_in_proj.weight', 'action_head.action_in_proj.bias', 'action_head.action_time_in.weight', 'action_head.action_time_in.bias', 'action_head.action_time_out.weight', 'action_head.action_time_out.bias', 'action_head.memory_proj.weight', 'action_head.memory_proj.bias', 'action_head.gemma.model.layers.0.self_attn.q_proj.weight', 'action_head.gemma.model.layers.0.self_attn.k_proj.weight', 'action_head.gemma.model.layers.0.self_attn.v_proj.weight', 'action_head.gemma.model.layers.0.self_attn.o_proj.weight', 'action_head.gemma.model.layers.0.mlp.gate_proj.weight', 'action_head.gemma.model.layers.0.mlp.up_proj.weight', 'action_head.gemma.model.layers.0.mlp.down_proj.weight', 'action_head.gemma.model.layers.0.input_layernorm.weight', 'action_head.gemma.model.layers.0.post_attention_layernorm.weight', 'action_head.gemma.model.layers.1.self_attn.q_proj.weight', 'action_head.gemma.model.layers.1.self_attn.k_proj.weight', 'action_head.gemma.model.layers.1.self_attn.v_proj.weight', 'action_head.gemma.model.layers.1.self_attn.o_proj.weight', 'action_head.gemma.model.layers.1.mlp.gate_proj.weight', 'action_head.gemma.model.layers.1.mlp.up_proj.weight', 'action_head.gemma.model.layers.1.mlp.down_proj.weight', 'action_head.gemma.model.layers.1.input_layernorm.weight', 'action_head.gemma.model.layers.1.post_attention_layernorm.weight', 'action_head.gemma.model.layers.2.self_attn.q_proj.weight', 'action_head.gemma.model.layers.2.self_attn.k_proj.weight', 'action_head.gemma.model.layers.2.self_attn.v_proj.weight', 'action_head.gemma.model.layers.2.self_attn.o_proj.weight', 'action_head.gemma.model.layers.2.mlp.gate_proj.weight', 'action_head.gemma.model.layers.2.mlp.up_proj.weight', 'action_head.gemma.model.layers.2.mlp.down_proj.weight', 'action_head.gemma.model.layers.2.input_layernorm.weight', 'action_head.gemma.model.layers.2.post_attention_layernorm.weight', 'action_head.gemma.model.layers.3.self_attn.q_proj.weight', 'action_head.gemma.model.layers.3.self_attn.k_proj.weight', 'action_head.gemma.model.layers.3.self_attn.v_proj.weight', 'action_head.gemma.model.layers.3.self_attn.o_proj.weight', 'action_head.gemma.model.layers.3.mlp.gate_proj.weight', 'action_head.gemma.model.layers.3.mlp.up_proj.weight', 'action_head.gemma.model.layers.3.mlp.down_proj.weight', 'action_head.gemma.model.layers.3.input_layernorm.weight', 'action_head.gemma.model.layers.3.post_attention_layernorm.weight', 'action_head.gemma.model.layers.4.self_attn.q_proj.weight', 'action_head.gemma.model.layers.4.self_attn.k_proj.weight', 'action_head.gemma.model.layers.4.self_attn.v_proj.weight', 'action_head.gemma.model.layers.4.self_attn.o_proj.weight', 'action_head.gemma.model.layers.4.mlp.gate_proj.weight', 'action_head.gemma.model.layers.4.mlp.up_proj.weight', 'action_head.gemma.model.layers.4.mlp.down_proj.weight', 'action_head.gemma.model.layers.4.input_layernorm.weight', 'action_head.gemma.model.layers.4.post_attention_layernorm.weight', 'action_head.gemma.model.layers.5.self_attn.q_proj.weight', 'action_head.gemma.model.layers.5.self_attn.k_proj.weight', 'action_head.gemma.model.layers.5.self_attn.v_proj.weight', 'action_head.gemma.model.layers.5.self_attn.o_proj.weight', 'action_head.gemma.model.layers.5.mlp.gate_proj.weight', 'action_head.gemma.model.layers.5.mlp.up_proj.weight', 'action_head.gemma.model.layers.5.mlp.down_proj.weight', 'action_head.gemma.model.layers.5.input_layernorm.weight', 'action_head.gemma.model.layers.5.post_attention_layernorm.weight', 'action_head.gemma.model.layers.6.self_attn.q_proj.weight', 'action_head.gemma.model.layers.6.self_attn.k_proj.weight', 'action_head.gemma.model.layers.6.self_attn.v_proj.weight', 'action_head.gemma.model.layers.6.self_attn.o_proj.weight', 'action_head.gemma.model.layers.6.mlp.gate_proj.weight', 'action_head.gemma.model.layers.6.mlp.up_proj.weight', 'action_head.gemma.model.layers.6.mlp.down_proj.weight', 'action_head.gemma.model.layers.6.input_layernorm.weight', 'action_head.gemma.model.layers.6.post_attention_ +unexpected keys: [] +************************* Initialize model successful! +************************* Before FSDP model wrapping +************************* FSDP model wrapping successful! +************************* Before building optimizer and scheduler +10/11 [16:40:34] INFO | >> Constructing optimizer with 2 param groups optim.py:1283 +************************************************** +After building optimizer and scheduler and model, before training, peak GPU memory (MB): 36856 +************************* VLATrainer initialized successfully! +************************* Before trainer.fit() +Pre-train system metrics + System/Peak GPU Memory (MB)=36,856 +10/11 [16:41:04] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/nn/modules/module.py:967: UserWarning: The .grad attribute warnings.py:109 + of a Tensor that is not a leaf Tensor is being accessed. Its .grad attribute won't be populated during autograd.backward(). If you indeed + want the .grad field to be populated for a non-leaf Tensor, use .retain_grad() on the non-leaf Tensor. If you access the non-leaf Tensor + by mistake, make sure you access the leaf Tensor instead. See github.com/pytorch/pytorch/pull/30531 for more informations. (Triggered + internally at /pytorch/build/aten/src/ATen/core/TensorBody.h:489.) + param_grad = param.grad + +[step=1/500000] + train/ActionNoiseL2Loss=1.586 + throughput/total_tokens=192,000 + System/Peak GPU Memory (MB)=44,240 +[step=2/500000] + train/ActionNoiseL2Loss=1.529 + throughput/total_tokens=384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,055 +[step=3/500000] + train/ActionNoiseL2Loss=1.609 + throughput/total_tokens=576,000 + throughput/device/tokens_per_second=1,119 + throughput/device/batches_per_second=0.0467 +[step=4/500000] + train/ActionNoiseL2Loss=1.598 + throughput/total_tokens=768,000 + throughput/device/tokens_per_second=1,112 + throughput/device/batches_per_second=0.0463 +[step=5/500000] + train/ActionNoiseL2Loss=1.489 + throughput/total_tokens=960,000 + throughput/device/tokens_per_second=1,119 + throughput/device/batches_per_second=0.0466 +[step=6/500000] + train/ActionNoiseL2Loss=1.489 + throughput/total_tokens=1,152,000 + throughput/device/tokens_per_second=1,123 + throughput/device/batches_per_second=0.0468 +[step=7/500000] + train/ActionNoiseL2Loss=1.414 + throughput/total_tokens=1,344,000 + throughput/device/tokens_per_second=1,127 + throughput/device/batches_per_second=0.0470 +[step=8/500000] + train/ActionNoiseL2Loss=1.397 + throughput/total_tokens=1,536,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=9/500000] + train/ActionNoiseL2Loss=1.379 + throughput/total_tokens=1,728,000 + throughput/device/tokens_per_second=1,130 + throughput/device/batches_per_second=0.0471 +[step=10/500000] + train/ActionNoiseL2Loss=1.263 + throughput/total_tokens=1,920,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 + System/Peak GPU Memory (MB)=51,073 +[step=11/500000] + train/ActionNoiseL2Loss=1.276 + throughput/total_tokens=2,112,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=12/500000] + train/ActionNoiseL2Loss=1.264 + throughput/total_tokens=2,304,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=13/500000] + train/ActionNoiseL2Loss=1.166 + throughput/total_tokens=2,496,000 + throughput/device/tokens_per_second=1,136 + throughput/device/batches_per_second=0.0474 +[step=14/500000] + train/ActionNoiseL2Loss=1.249 + throughput/total_tokens=2,688,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=15/500000] + train/ActionNoiseL2Loss=1.287 + throughput/total_tokens=2,880,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=16/500000] + train/ActionNoiseL2Loss=1.197 + throughput/total_tokens=3,072,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=17/500000] + train/ActionNoiseL2Loss=1.156 + throughput/total_tokens=3,264,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=18/500000] + train/ActionNoiseL2Loss=1.157 + throughput/total_tokens=3,456,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=19/500000] + train/ActionNoiseL2Loss=1.148 + throughput/total_tokens=3,648,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=20/500000] + optim/total_grad_norm=14.54 + train/ActionNoiseL2Loss=1.152 + throughput/total_tokens=3,840,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 + System/Peak GPU Memory (MB)=51,073 +[step=21/500000] + train/ActionNoiseL2Loss=1.121 + throughput/total_tokens=4,032,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=22/500000] + train/ActionNoiseL2Loss=1.293 + throughput/total_tokens=4,224,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=23/500000] + train/ActionNoiseL2Loss=1.132 + throughput/total_tokens=4,416,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=24/500000] + train/ActionNoiseL2Loss=1.020 + throughput/total_tokens=4,608,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=25/500000] + train/ActionNoiseL2Loss=1.042 + throughput/total_tokens=4,800,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=26/500000] + train/ActionNoiseL2Loss=1.042 + throughput/total_tokens=4,992,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=27/500000] + train/ActionNoiseL2Loss=1.051 + throughput/total_tokens=5,184,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=28/500000] + train/ActionNoiseL2Loss=1.010 + throughput/total_tokens=5,376,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=29/500000] + train/ActionNoiseL2Loss=1.014 + throughput/total_tokens=5,568,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=30/500000] + train/ActionNoiseL2Loss=0.9981 + throughput/total_tokens=5,760,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,073 +[step=31/500000] + train/ActionNoiseL2Loss=0.8705 + throughput/total_tokens=5,952,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=32/500000] + train/ActionNoiseL2Loss=0.8819 + throughput/total_tokens=6,144,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=33/500000] + train/ActionNoiseL2Loss=0.9982 + throughput/total_tokens=6,336,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=34/500000] + train/ActionNoiseL2Loss=0.9402 + throughput/total_tokens=6,528,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=35/500000] + train/ActionNoiseL2Loss=0.9103 + throughput/total_tokens=6,720,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=36/500000] + train/ActionNoiseL2Loss=0.9603 + throughput/total_tokens=6,912,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=37/500000] + train/ActionNoiseL2Loss=0.8358 + throughput/total_tokens=7,104,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=38/500000] + train/ActionNoiseL2Loss=0.8783 + throughput/total_tokens=7,296,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=39/500000] + train/ActionNoiseL2Loss=0.9675 + throughput/total_tokens=7,488,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=40/500000] + optim/total_grad_norm=8.826 + train/ActionNoiseL2Loss=0.8044 + throughput/total_tokens=7,680,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,076 +[step=41/500000] + train/ActionNoiseL2Loss=0.7547 + throughput/total_tokens=7,872,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=42/500000] + train/ActionNoiseL2Loss=0.8020 + throughput/total_tokens=8,064,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=43/500000] + train/ActionNoiseL2Loss=0.8448 + throughput/total_tokens=8,256,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=44/500000] + train/ActionNoiseL2Loss=0.8627 + throughput/total_tokens=8,448,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=45/500000] + train/ActionNoiseL2Loss=0.7378 + throughput/total_tokens=8,640,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=46/500000] + train/ActionNoiseL2Loss=0.7764 + throughput/total_tokens=8,832,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=47/500000] + train/ActionNoiseL2Loss=0.8475 + throughput/total_tokens=9,024,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=48/500000] + train/ActionNoiseL2Loss=0.8008 + throughput/total_tokens=9,216,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=49/500000] + train/ActionNoiseL2Loss=0.7370 + throughput/total_tokens=9,408,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=50/500000] + train/ActionNoiseL2Loss=0.7342 + throughput/total_tokens=9,600,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,076 +[step=51/500000] + train/ActionNoiseL2Loss=0.6308 + throughput/total_tokens=9,792,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=52/500000] + train/ActionNoiseL2Loss=0.6825 + throughput/total_tokens=9,984,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=53/500000] + train/ActionNoiseL2Loss=0.6383 + throughput/total_tokens=10,176,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=54/500000] + train/ActionNoiseL2Loss=0.7288 + throughput/total_tokens=10,368,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=55/500000] + train/ActionNoiseL2Loss=0.7090 + throughput/total_tokens=10,560,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=56/500000] + train/ActionNoiseL2Loss=0.7178 + throughput/total_tokens=10,752,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=57/500000] + train/ActionNoiseL2Loss=0.6533 + throughput/total_tokens=10,944,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=58/500000] + train/ActionNoiseL2Loss=0.5923 + throughput/total_tokens=11,136,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=59/500000] + train/ActionNoiseL2Loss=0.6169 + throughput/total_tokens=11,328,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=60/500000] + optim/total_grad_norm=8.267 + train/ActionNoiseL2Loss=0.5762 + throughput/total_tokens=11,520,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 + System/Peak GPU Memory (MB)=51,076 +[step=61/500000] + train/ActionNoiseL2Loss=0.7139 + throughput/total_tokens=11,712,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=62/500000] + train/ActionNoiseL2Loss=0.6014 + throughput/total_tokens=11,904,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=63/500000] + train/ActionNoiseL2Loss=0.6061 + throughput/total_tokens=12,096,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=64/500000] + train/ActionNoiseL2Loss=0.5900 + throughput/total_tokens=12,288,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=65/500000] + train/ActionNoiseL2Loss=0.6555 + throughput/total_tokens=12,480,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=66/500000] + train/ActionNoiseL2Loss=0.5814 + throughput/total_tokens=12,672,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=67/500000] + train/ActionNoiseL2Loss=0.5342 + throughput/total_tokens=12,864,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=68/500000] + train/ActionNoiseL2Loss=0.5512 + throughput/total_tokens=13,056,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=69/500000] + train/ActionNoiseL2Loss=0.4740 + throughput/total_tokens=13,248,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=70/500000] + train/ActionNoiseL2Loss=0.4216 + throughput/total_tokens=13,440,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=71/500000] + train/ActionNoiseL2Loss=0.5069 + throughput/total_tokens=13,632,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=72/500000] + train/ActionNoiseL2Loss=0.6212 + throughput/total_tokens=13,824,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=73/500000] + train/ActionNoiseL2Loss=0.5242 + throughput/total_tokens=14,016,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=74/500000] + train/ActionNoiseL2Loss=0.4329 + throughput/total_tokens=14,208,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=75/500000] + train/ActionNoiseL2Loss=0.4913 + throughput/total_tokens=14,400,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=76/500000] + train/ActionNoiseL2Loss=0.4830 + throughput/total_tokens=14,592,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=77/500000] + train/ActionNoiseL2Loss=0.3968 + throughput/total_tokens=14,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=78/500000] + train/ActionNoiseL2Loss=0.5455 + throughput/total_tokens=14,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=79/500000] + train/ActionNoiseL2Loss=0.4839 + throughput/total_tokens=15,168,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=80/500000] + optim/total_grad_norm=10.55 + train/ActionNoiseL2Loss=0.4352 + throughput/total_tokens=15,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=81/500000] + train/ActionNoiseL2Loss=0.5366 + throughput/total_tokens=15,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=82/500000] + train/ActionNoiseL2Loss=0.4305 + throughput/total_tokens=15,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=83/500000] + train/ActionNoiseL2Loss=0.4317 + throughput/total_tokens=15,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=84/500000] + train/ActionNoiseL2Loss=0.4101 + throughput/total_tokens=16,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=85/500000] + train/ActionNoiseL2Loss=0.5972 + throughput/total_tokens=16,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=86/500000] + train/ActionNoiseL2Loss=0.4077 + throughput/total_tokens=16,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=87/500000] + train/ActionNoiseL2Loss=0.4265 + throughput/total_tokens=16,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=88/500000] + train/ActionNoiseL2Loss=0.4675 + throughput/total_tokens=16,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=89/500000] + train/ActionNoiseL2Loss=0.4191 + throughput/total_tokens=17,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=90/500000] + train/ActionNoiseL2Loss=0.3748 + throughput/total_tokens=17,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=91/500000] + train/ActionNoiseL2Loss=0.4929 + throughput/total_tokens=17,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=92/500000] + train/ActionNoiseL2Loss=0.4039 + throughput/total_tokens=17,664,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=93/500000] + train/ActionNoiseL2Loss=0.3737 + throughput/total_tokens=17,856,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=94/500000] + train/ActionNoiseL2Loss=0.4333 + throughput/total_tokens=18,048,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=95/500000] + train/ActionNoiseL2Loss=0.4066 + throughput/total_tokens=18,240,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=96/500000] + train/ActionNoiseL2Loss=0.3296 + throughput/total_tokens=18,432,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=97/500000] + train/ActionNoiseL2Loss=0.3486 + throughput/total_tokens=18,624,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=98/500000] + train/ActionNoiseL2Loss=0.4988 + throughput/total_tokens=18,816,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=99/500000] + train/ActionNoiseL2Loss=0.3136 + throughput/total_tokens=19,008,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=100/500000] + optim/total_grad_norm=6.078 + train/ActionNoiseL2Loss=0.4168 + throughput/total_tokens=19,200,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=101/500000] + train/ActionNoiseL2Loss=0.4496 + throughput/total_tokens=19,392,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=102/500000] + train/ActionNoiseL2Loss=0.3718 + throughput/total_tokens=19,584,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=103/500000] + train/ActionNoiseL2Loss=0.2987 + throughput/total_tokens=19,776,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=104/500000] + train/ActionNoiseL2Loss=0.3604 + throughput/total_tokens=19,968,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=105/500000] + train/ActionNoiseL2Loss=0.3747 + throughput/total_tokens=20,160,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=106/500000] + train/ActionNoiseL2Loss=0.2977 + throughput/total_tokens=20,352,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=107/500000] + train/ActionNoiseL2Loss=0.2903 + throughput/total_tokens=20,544,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=108/500000] + train/ActionNoiseL2Loss=0.3485 + throughput/total_tokens=20,736,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=109/500000] + train/ActionNoiseL2Loss=0.3506 + throughput/total_tokens=20,928,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=110/500000] + train/ActionNoiseL2Loss=0.2849 + throughput/total_tokens=21,120,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 + System/Peak GPU Memory (MB)=51,076 +[step=111/500000] + train/ActionNoiseL2Loss=0.2498 + throughput/total_tokens=21,312,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=112/500000] + train/ActionNoiseL2Loss=0.4222 + throughput/total_tokens=21,504,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=113/500000] + train/ActionNoiseL2Loss=0.2249 + throughput/total_tokens=21,696,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=114/500000] + train/ActionNoiseL2Loss=0.4359 + throughput/total_tokens=21,888,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=115/500000] + train/ActionNoiseL2Loss=0.3813 + throughput/total_tokens=22,080,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=116/500000] + train/ActionNoiseL2Loss=0.2577 + throughput/total_tokens=22,272,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=117/500000] + train/ActionNoiseL2Loss=0.2709 + throughput/total_tokens=22,464,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=118/500000] + train/ActionNoiseL2Loss=0.3620 + throughput/total_tokens=22,656,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=119/500000] + train/ActionNoiseL2Loss=0.3145 + throughput/total_tokens=22,848,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=120/500000] + optim/total_grad_norm=10.46 + train/ActionNoiseL2Loss=0.3516 + throughput/total_tokens=23,040,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=121/500000] + train/ActionNoiseL2Loss=0.2822 + throughput/total_tokens=23,232,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=122/500000] + train/ActionNoiseL2Loss=0.2792 + throughput/total_tokens=23,424,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=123/500000] + train/ActionNoiseL2Loss=0.3838 + throughput/total_tokens=23,616,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=124/500000] + train/ActionNoiseL2Loss=0.4181 + throughput/total_tokens=23,808,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=125/500000] + train/ActionNoiseL2Loss=0.2046 + throughput/total_tokens=24,000,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=126/500000] + train/ActionNoiseL2Loss=0.3426 + throughput/total_tokens=24,192,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=127/500000] + train/ActionNoiseL2Loss=0.2601 + throughput/total_tokens=24,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=128/500000] + train/ActionNoiseL2Loss=0.4509 + throughput/total_tokens=24,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=129/500000] + train/ActionNoiseL2Loss=0.2848 + throughput/total_tokens=24,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=130/500000] + train/ActionNoiseL2Loss=0.2213 + throughput/total_tokens=24,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=131/500000] + train/ActionNoiseL2Loss=0.3812 + throughput/total_tokens=25,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=132/500000] + train/ActionNoiseL2Loss=0.2669 + throughput/total_tokens=25,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=133/500000] + train/ActionNoiseL2Loss=0.3637 + throughput/total_tokens=25,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=134/500000] + train/ActionNoiseL2Loss=0.2769 + throughput/total_tokens=25,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=135/500000] + train/ActionNoiseL2Loss=0.3032 + throughput/total_tokens=25,920,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=136/500000] + train/ActionNoiseL2Loss=0.2963 + throughput/total_tokens=26,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=137/500000] + train/ActionNoiseL2Loss=0.3207 + throughput/total_tokens=26,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=138/500000] + train/ActionNoiseL2Loss=0.3375 + throughput/total_tokens=26,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=139/500000] + train/ActionNoiseL2Loss=0.2256 + throughput/total_tokens=26,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=140/500000] + optim/total_grad_norm=6.710 + train/ActionNoiseL2Loss=0.2705 + throughput/total_tokens=26,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=141/500000] + train/ActionNoiseL2Loss=0.2114 + throughput/total_tokens=27,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=142/500000] + train/ActionNoiseL2Loss=0.2438 + throughput/total_tokens=27,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=143/500000] + train/ActionNoiseL2Loss=0.2450 + throughput/total_tokens=27,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=144/500000] + train/ActionNoiseL2Loss=0.2556 + throughput/total_tokens=27,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=145/500000] + train/ActionNoiseL2Loss=0.3462 + throughput/total_tokens=27,840,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=146/500000] + train/ActionNoiseL2Loss=0.3405 + throughput/total_tokens=28,032,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=147/500000] + train/ActionNoiseL2Loss=0.2187 + throughput/total_tokens=28,224,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=148/500000] + train/ActionNoiseL2Loss=0.1648 + throughput/total_tokens=28,416,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=149/500000] + train/ActionNoiseL2Loss=0.2387 + throughput/total_tokens=28,608,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=150/500000] + train/ActionNoiseL2Loss=0.2694 + throughput/total_tokens=28,800,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=151/500000] + train/ActionNoiseL2Loss=0.2443 + throughput/total_tokens=28,992,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=152/500000] + train/ActionNoiseL2Loss=0.3691 + throughput/total_tokens=29,184,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=153/500000] + train/ActionNoiseL2Loss=0.3537 + throughput/total_tokens=29,376,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=154/500000] + train/ActionNoiseL2Loss=0.2437 + throughput/total_tokens=29,568,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=155/500000] + train/ActionNoiseL2Loss=0.3596 + throughput/total_tokens=29,760,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=156/500000] + train/ActionNoiseL2Loss=0.2188 + throughput/total_tokens=29,952,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=157/500000] + train/ActionNoiseL2Loss=0.4094 + throughput/total_tokens=30,144,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=158/500000] + train/ActionNoiseL2Loss=0.1954 + throughput/total_tokens=30,336,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=159/500000] + train/ActionNoiseL2Loss=0.1857 + throughput/total_tokens=30,528,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=160/500000] + optim/total_grad_norm=12.26 + train/ActionNoiseL2Loss=0.3247 + throughput/total_tokens=30,720,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,076 +[step=161/500000] + train/ActionNoiseL2Loss=0.3050 + throughput/total_tokens=30,912,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=162/500000] + train/ActionNoiseL2Loss=0.2087 + throughput/total_tokens=31,104,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=163/500000] + train/ActionNoiseL2Loss=0.2399 + throughput/total_tokens=31,296,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=164/500000] + train/ActionNoiseL2Loss=0.2621 + throughput/total_tokens=31,488,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=165/500000] + train/ActionNoiseL2Loss=0.3091 + throughput/total_tokens=31,680,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=166/500000] + train/ActionNoiseL2Loss=0.2534 + throughput/total_tokens=31,872,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=167/500000] + train/ActionNoiseL2Loss=0.2628 + throughput/total_tokens=32,064,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=168/500000] + train/ActionNoiseL2Loss=0.3505 + throughput/total_tokens=32,256,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=169/500000] + train/ActionNoiseL2Loss=0.2734 + throughput/total_tokens=32,448,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=170/500000] + train/ActionNoiseL2Loss=0.2602 + throughput/total_tokens=32,640,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=171/500000] + train/ActionNoiseL2Loss=0.2646 + throughput/total_tokens=32,832,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=172/500000] + train/ActionNoiseL2Loss=0.1685 + throughput/total_tokens=33,024,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=173/500000] + train/ActionNoiseL2Loss=0.2083 + throughput/total_tokens=33,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=174/500000] + train/ActionNoiseL2Loss=0.2812 + throughput/total_tokens=33,408,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=175/500000] + train/ActionNoiseL2Loss=0.3529 + throughput/total_tokens=33,600,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=176/500000] + train/ActionNoiseL2Loss=0.2386 + throughput/total_tokens=33,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=177/500000] + train/ActionNoiseL2Loss=0.2328 + throughput/total_tokens=33,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=178/500000] + train/ActionNoiseL2Loss=0.3888 + throughput/total_tokens=34,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=179/500000] + train/ActionNoiseL2Loss=0.2722 + throughput/total_tokens=34,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=180/500000] + optim/total_grad_norm=6.009 + train/ActionNoiseL2Loss=0.1856 + throughput/total_tokens=34,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=181/500000] + train/ActionNoiseL2Loss=0.1854 + throughput/total_tokens=34,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=182/500000] + train/ActionNoiseL2Loss=0.2290 + throughput/total_tokens=34,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=183/500000] + train/ActionNoiseL2Loss=0.2619 + throughput/total_tokens=35,136,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=184/500000] + train/ActionNoiseL2Loss=0.2893 + throughput/total_tokens=35,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=185/500000] + train/ActionNoiseL2Loss=0.2927 + throughput/total_tokens=35,520,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=186/500000] + train/ActionNoiseL2Loss=0.2269 + throughput/total_tokens=35,712,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=187/500000] + train/ActionNoiseL2Loss=0.1694 + throughput/total_tokens=35,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=188/500000] + train/ActionNoiseL2Loss=0.2577 + throughput/total_tokens=36,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=189/500000] + train/ActionNoiseL2Loss=0.4108 + throughput/total_tokens=36,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=190/500000] + train/ActionNoiseL2Loss=0.1790 + throughput/total_tokens=36,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=191/500000] + train/ActionNoiseL2Loss=0.2157 + throughput/total_tokens=36,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=192/500000] + train/ActionNoiseL2Loss=0.1835 + throughput/total_tokens=36,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=193/500000] + train/ActionNoiseL2Loss=0.1934 + throughput/total_tokens=37,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=194/500000] + train/ActionNoiseL2Loss=0.2750 + throughput/total_tokens=37,248,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=195/500000] + train/ActionNoiseL2Loss=0.2744 + throughput/total_tokens=37,440,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=196/500000] + train/ActionNoiseL2Loss=0.1852 + throughput/total_tokens=37,632,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=197/500000] + train/ActionNoiseL2Loss=0.2405 + throughput/total_tokens=37,824,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=198/500000] + train/ActionNoiseL2Loss=0.1867 + throughput/total_tokens=38,016,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=199/500000] + train/ActionNoiseL2Loss=0.2228 + throughput/total_tokens=38,208,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=200/500000] + optim/total_grad_norm=6.929 + train/ActionNoiseL2Loss=0.1866 + throughput/total_tokens=38,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=201/500000] + train/ActionNoiseL2Loss=0.1643 + throughput/total_tokens=38,592,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=202/500000] + train/ActionNoiseL2Loss=0.3130 + throughput/total_tokens=38,784,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=203/500000] + train/ActionNoiseL2Loss=0.2355 + throughput/total_tokens=38,976,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=204/500000] + train/ActionNoiseL2Loss=0.1947 + throughput/total_tokens=39,168,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=205/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=39,360,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=206/500000] + train/ActionNoiseL2Loss=0.1911 + throughput/total_tokens=39,552,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=207/500000] + train/ActionNoiseL2Loss=0.2952 + throughput/total_tokens=39,744,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=208/500000] + train/ActionNoiseL2Loss=0.2752 + throughput/total_tokens=39,936,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=209/500000] + train/ActionNoiseL2Loss=0.2497 + throughput/total_tokens=40,128,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=210/500000] + train/ActionNoiseL2Loss=0.1970 + throughput/total_tokens=40,320,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 + System/Peak GPU Memory (MB)=51,076 +[step=211/500000] + train/ActionNoiseL2Loss=0.3421 + throughput/total_tokens=40,512,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=212/500000] + train/ActionNoiseL2Loss=0.2197 + throughput/total_tokens=40,704,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=213/500000] + train/ActionNoiseL2Loss=0.2408 + throughput/total_tokens=40,896,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=214/500000] + train/ActionNoiseL2Loss=0.1770 + throughput/total_tokens=41,088,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=215/500000] + train/ActionNoiseL2Loss=0.2504 + throughput/total_tokens=41,280,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=216/500000] + train/ActionNoiseL2Loss=0.2978 + throughput/total_tokens=41,472,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=217/500000] + train/ActionNoiseL2Loss=0.1905 + throughput/total_tokens=41,664,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=218/500000] + train/ActionNoiseL2Loss=0.2631 + throughput/total_tokens=41,856,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=219/500000] + train/ActionNoiseL2Loss=0.2373 + throughput/total_tokens=42,048,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=220/500000] + optim/total_grad_norm=10.42 + train/ActionNoiseL2Loss=0.3217 + throughput/total_tokens=42,240,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=221/500000] + train/ActionNoiseL2Loss=0.1636 + throughput/total_tokens=42,432,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=222/500000] + train/ActionNoiseL2Loss=0.2111 + throughput/total_tokens=42,624,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=223/500000] + train/ActionNoiseL2Loss=0.2009 + throughput/total_tokens=42,816,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=224/500000] + train/ActionNoiseL2Loss=0.1348 + throughput/total_tokens=43,008,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=225/500000] + train/ActionNoiseL2Loss=0.2247 + throughput/total_tokens=43,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=226/500000] + train/ActionNoiseL2Loss=0.3079 + throughput/total_tokens=43,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=227/500000] + train/ActionNoiseL2Loss=0.2777 + throughput/total_tokens=43,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=228/500000] + train/ActionNoiseL2Loss=0.2443 + throughput/total_tokens=43,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=229/500000] + train/ActionNoiseL2Loss=0.3342 + throughput/total_tokens=43,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=230/500000] + train/ActionNoiseL2Loss=0.2273 + throughput/total_tokens=44,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=231/500000] + train/ActionNoiseL2Loss=0.3006 + throughput/total_tokens=44,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=232/500000] + train/ActionNoiseL2Loss=0.2366 + throughput/total_tokens=44,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=233/500000] + train/ActionNoiseL2Loss=0.1662 + throughput/total_tokens=44,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=234/500000] + train/ActionNoiseL2Loss=0.2410 + throughput/total_tokens=44,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=235/500000] + train/ActionNoiseL2Loss=0.2971 + throughput/total_tokens=45,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=236/500000] + train/ActionNoiseL2Loss=0.2302 + throughput/total_tokens=45,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=237/500000] + train/ActionNoiseL2Loss=0.1802 + throughput/total_tokens=45,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=238/500000] + train/ActionNoiseL2Loss=0.1807 + throughput/total_tokens=45,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=239/500000] + train/ActionNoiseL2Loss=0.1699 + throughput/total_tokens=45,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=240/500000] + optim/total_grad_norm=8.866 + train/ActionNoiseL2Loss=0.2549 + throughput/total_tokens=46,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=241/500000] + train/ActionNoiseL2Loss=0.2429 + throughput/total_tokens=46,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=242/500000] + train/ActionNoiseL2Loss=0.3056 + throughput/total_tokens=46,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=243/500000] + train/ActionNoiseL2Loss=0.2302 + throughput/total_tokens=46,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=244/500000] + train/ActionNoiseL2Loss=0.2132 + throughput/total_tokens=46,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=245/500000] + train/ActionNoiseL2Loss=0.1951 + throughput/total_tokens=47,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=246/500000] + train/ActionNoiseL2Loss=0.1965 + throughput/total_tokens=47,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=247/500000] + train/ActionNoiseL2Loss=0.2805 + throughput/total_tokens=47,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=248/500000] + train/ActionNoiseL2Loss=0.1867 + throughput/total_tokens=47,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=249/500000] + train/ActionNoiseL2Loss=0.2623 + throughput/total_tokens=47,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=250/500000] + train/ActionNoiseL2Loss=0.1689 + throughput/total_tokens=48,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=251/500000] + train/ActionNoiseL2Loss=0.1813 + throughput/total_tokens=48,192,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=252/500000] + train/ActionNoiseL2Loss=0.1525 + throughput/total_tokens=48,384,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=253/500000] + train/ActionNoiseL2Loss=0.2099 + throughput/total_tokens=48,576,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=254/500000] + train/ActionNoiseL2Loss=0.1689 + throughput/total_tokens=48,768,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=255/500000] + train/ActionNoiseL2Loss=0.1582 + throughput/total_tokens=48,960,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=256/500000] + train/ActionNoiseL2Loss=0.2659 + throughput/total_tokens=49,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=257/500000] + train/ActionNoiseL2Loss=0.1480 + throughput/total_tokens=49,344,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=258/500000] + train/ActionNoiseL2Loss=0.1836 + throughput/total_tokens=49,536,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=259/500000] + train/ActionNoiseL2Loss=0.2814 + throughput/total_tokens=49,728,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=260/500000] + optim/total_grad_norm=7.971 + train/ActionNoiseL2Loss=0.2725 + throughput/total_tokens=49,920,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=261/500000] + train/ActionNoiseL2Loss=0.1896 + throughput/total_tokens=50,112,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=262/500000] + train/ActionNoiseL2Loss=0.2173 + throughput/total_tokens=50,304,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=263/500000] + train/ActionNoiseL2Loss=0.2441 + throughput/total_tokens=50,496,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=264/500000] + train/ActionNoiseL2Loss=0.2635 + throughput/total_tokens=50,688,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=265/500000] + train/ActionNoiseL2Loss=0.3150 + throughput/total_tokens=50,880,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=266/500000] + train/ActionNoiseL2Loss=0.2075 + throughput/total_tokens=51,072,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=267/500000] + train/ActionNoiseL2Loss=0.2010 + throughput/total_tokens=51,264,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=268/500000] + train/ActionNoiseL2Loss=0.2119 + throughput/total_tokens=51,456,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=269/500000] + train/ActionNoiseL2Loss=0.2493 + throughput/total_tokens=51,648,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=270/500000] + train/ActionNoiseL2Loss=0.2076 + throughput/total_tokens=51,840,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=271/500000] + train/ActionNoiseL2Loss=0.1884 + throughput/total_tokens=52,032,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=272/500000] + train/ActionNoiseL2Loss=0.1927 + throughput/total_tokens=52,224,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=273/500000] + train/ActionNoiseL2Loss=0.2474 + throughput/total_tokens=52,416,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=274/500000] + train/ActionNoiseL2Loss=0.2009 + throughput/total_tokens=52,608,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=275/500000] + train/ActionNoiseL2Loss=0.1578 + throughput/total_tokens=52,800,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=276/500000] + train/ActionNoiseL2Loss=0.2378 + throughput/total_tokens=52,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=277/500000] + train/ActionNoiseL2Loss=0.2924 + throughput/total_tokens=53,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=278/500000] + train/ActionNoiseL2Loss=0.2547 + throughput/total_tokens=53,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=279/500000] + train/ActionNoiseL2Loss=0.2377 + throughput/total_tokens=53,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=280/500000] + optim/total_grad_norm=9.087 + train/ActionNoiseL2Loss=0.2162 + throughput/total_tokens=53,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=281/500000] + train/ActionNoiseL2Loss=0.2772 + throughput/total_tokens=53,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=282/500000] + train/ActionNoiseL2Loss=0.3190 + throughput/total_tokens=54,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=283/500000] + train/ActionNoiseL2Loss=0.1921 + throughput/total_tokens=54,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=284/500000] + train/ActionNoiseL2Loss=0.2171 + throughput/total_tokens=54,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=285/500000] + train/ActionNoiseL2Loss=0.1544 + throughput/total_tokens=54,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=286/500000] + train/ActionNoiseL2Loss=0.2547 + throughput/total_tokens=54,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=287/500000] + train/ActionNoiseL2Loss=0.2228 + throughput/total_tokens=55,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=288/500000] + train/ActionNoiseL2Loss=0.2570 + throughput/total_tokens=55,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=289/500000] + train/ActionNoiseL2Loss=0.3060 + throughput/total_tokens=55,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=290/500000] + train/ActionNoiseL2Loss=0.2145 + throughput/total_tokens=55,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=291/500000] + train/ActionNoiseL2Loss=0.2196 + throughput/total_tokens=55,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=292/500000] + train/ActionNoiseL2Loss=0.2024 + throughput/total_tokens=56,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=293/500000] + train/ActionNoiseL2Loss=0.2615 + throughput/total_tokens=56,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=294/500000] + train/ActionNoiseL2Loss=0.1390 + throughput/total_tokens=56,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=295/500000] + train/ActionNoiseL2Loss=0.1421 + throughput/total_tokens=56,640,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=296/500000] + train/ActionNoiseL2Loss=0.1699 + throughput/total_tokens=56,832,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=297/500000] + train/ActionNoiseL2Loss=0.2362 + throughput/total_tokens=57,024,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=298/500000] + train/ActionNoiseL2Loss=0.2107 + throughput/total_tokens=57,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=299/500000] + train/ActionNoiseL2Loss=0.1247 + throughput/total_tokens=57,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=300/500000] + optim/total_grad_norm=8.917 + train/ActionNoiseL2Loss=0.3213 + throughput/total_tokens=57,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=301/500000] + train/ActionNoiseL2Loss=0.1995 + throughput/total_tokens=57,792,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=302/500000] + train/ActionNoiseL2Loss=0.1711 + throughput/total_tokens=57,984,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=303/500000] + train/ActionNoiseL2Loss=0.1121 + throughput/total_tokens=58,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=304/500000] + train/ActionNoiseL2Loss=0.2212 + throughput/total_tokens=58,368,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=305/500000] + train/ActionNoiseL2Loss=0.1831 + throughput/total_tokens=58,560,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=306/500000] + train/ActionNoiseL2Loss=0.2619 + throughput/total_tokens=58,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=307/500000] + train/ActionNoiseL2Loss=0.2711 + throughput/total_tokens=58,944,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=308/500000] + train/ActionNoiseL2Loss=0.2428 + throughput/total_tokens=59,136,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=309/500000] + train/ActionNoiseL2Loss=0.1866 + throughput/total_tokens=59,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=310/500000] + train/ActionNoiseL2Loss=0.2395 + throughput/total_tokens=59,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=311/500000] + train/ActionNoiseL2Loss=0.1835 + throughput/total_tokens=59,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=312/500000] + train/ActionNoiseL2Loss=0.1972 + throughput/total_tokens=59,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=313/500000] + train/ActionNoiseL2Loss=0.2390 + throughput/total_tokens=60,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=314/500000] + train/ActionNoiseL2Loss=0.2208 + throughput/total_tokens=60,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=315/500000] + train/ActionNoiseL2Loss=0.1820 + throughput/total_tokens=60,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=316/500000] + train/ActionNoiseL2Loss=0.1788 + throughput/total_tokens=60,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=317/500000] + train/ActionNoiseL2Loss=0.1916 + throughput/total_tokens=60,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=318/500000] + train/ActionNoiseL2Loss=0.1848 + throughput/total_tokens=61,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=319/500000] + train/ActionNoiseL2Loss=0.1941 + throughput/total_tokens=61,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=320/500000] + optim/total_grad_norm=4.298 + train/ActionNoiseL2Loss=0.1485 + throughput/total_tokens=61,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=321/500000] + train/ActionNoiseL2Loss=0.1607 + throughput/total_tokens=61,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=322/500000] + train/ActionNoiseL2Loss=0.3072 + throughput/total_tokens=61,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=323/500000] + train/ActionNoiseL2Loss=0.3027 + throughput/total_tokens=62,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=324/500000] + train/ActionNoiseL2Loss=0.1642 + throughput/total_tokens=62,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=325/500000] + train/ActionNoiseL2Loss=0.2820 + throughput/total_tokens=62,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=326/500000] + train/ActionNoiseL2Loss=0.1822 + throughput/total_tokens=62,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=327/500000] + train/ActionNoiseL2Loss=0.2096 + throughput/total_tokens=62,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=328/500000] + train/ActionNoiseL2Loss=0.2001 + throughput/total_tokens=62,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=329/500000] + train/ActionNoiseL2Loss=0.1698 + throughput/total_tokens=63,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=330/500000] + train/ActionNoiseL2Loss=0.2273 + throughput/total_tokens=63,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=331/500000] + train/ActionNoiseL2Loss=0.1660 + throughput/total_tokens=63,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=332/500000] + train/ActionNoiseL2Loss=0.1264 + throughput/total_tokens=63,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=333/500000] + train/ActionNoiseL2Loss=0.1762 + throughput/total_tokens=63,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=334/500000] + train/ActionNoiseL2Loss=0.1701 + throughput/total_tokens=64,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=335/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=64,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=336/500000] + train/ActionNoiseL2Loss=0.1166 + throughput/total_tokens=64,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=337/500000] + train/ActionNoiseL2Loss=0.2621 + throughput/total_tokens=64,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=338/500000] + train/ActionNoiseL2Loss=0.3394 + throughput/total_tokens=64,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=339/500000] + train/ActionNoiseL2Loss=0.2995 + throughput/total_tokens=65,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=340/500000] + optim/total_grad_norm=5.948 + train/ActionNoiseL2Loss=0.1478 + throughput/total_tokens=65,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=341/500000] + train/ActionNoiseL2Loss=0.2637 + throughput/total_tokens=65,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=342/500000] + train/ActionNoiseL2Loss=0.2835 + throughput/total_tokens=65,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=343/500000] + train/ActionNoiseL2Loss=0.2141 + throughput/total_tokens=65,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=344/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=66,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=345/500000] + train/ActionNoiseL2Loss=0.2630 + throughput/total_tokens=66,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=346/500000] + train/ActionNoiseL2Loss=0.1676 + throughput/total_tokens=66,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=347/500000] + train/ActionNoiseL2Loss=0.1561 + throughput/total_tokens=66,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=348/500000] + train/ActionNoiseL2Loss=0.1854 + throughput/total_tokens=66,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=349/500000] + train/ActionNoiseL2Loss=0.3514 + throughput/total_tokens=67,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=350/500000] + train/ActionNoiseL2Loss=0.1847 + throughput/total_tokens=67,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=351/500000] + train/ActionNoiseL2Loss=0.2024 + throughput/total_tokens=67,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=352/500000] + train/ActionNoiseL2Loss=0.2149 + throughput/total_tokens=67,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=353/500000] + train/ActionNoiseL2Loss=0.1842 + throughput/total_tokens=67,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=354/500000] + train/ActionNoiseL2Loss=0.1598 + throughput/total_tokens=67,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=355/500000] + train/ActionNoiseL2Loss=0.2152 + throughput/total_tokens=68,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=356/500000] + train/ActionNoiseL2Loss=0.2375 + throughput/total_tokens=68,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=357/500000] + train/ActionNoiseL2Loss=0.1946 + throughput/total_tokens=68,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=358/500000] + train/ActionNoiseL2Loss=0.2454 + throughput/total_tokens=68,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=359/500000] + train/ActionNoiseL2Loss=0.1150 + throughput/total_tokens=68,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=360/500000] + optim/total_grad_norm=4.916 + train/ActionNoiseL2Loss=0.1861 + throughput/total_tokens=69,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=361/500000] + train/ActionNoiseL2Loss=0.1355 + throughput/total_tokens=69,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=362/500000] + train/ActionNoiseL2Loss=0.2826 + throughput/total_tokens=69,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=363/500000] + train/ActionNoiseL2Loss=0.1953 + throughput/total_tokens=69,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=364/500000] + train/ActionNoiseL2Loss=0.1954 + throughput/total_tokens=69,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=365/500000] + train/ActionNoiseL2Loss=0.1627 + throughput/total_tokens=70,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=366/500000] + train/ActionNoiseL2Loss=0.1465 + throughput/total_tokens=70,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=367/500000] + train/ActionNoiseL2Loss=0.2114 + throughput/total_tokens=70,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=368/500000] + train/ActionNoiseL2Loss=0.1460 + throughput/total_tokens=70,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=369/500000] + train/ActionNoiseL2Loss=0.1578 + throughput/total_tokens=70,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=370/500000] + train/ActionNoiseL2Loss=0.1653 + throughput/total_tokens=71,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=371/500000] + train/ActionNoiseL2Loss=0.1645 + throughput/total_tokens=71,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=372/500000] + train/ActionNoiseL2Loss=0.1302 + throughput/total_tokens=71,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=373/500000] + train/ActionNoiseL2Loss=0.1583 + throughput/total_tokens=71,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=374/500000] + train/ActionNoiseL2Loss=0.2586 + throughput/total_tokens=71,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=375/500000] + train/ActionNoiseL2Loss=0.1699 + throughput/total_tokens=72,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=376/500000] + train/ActionNoiseL2Loss=0.1574 + throughput/total_tokens=72,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=377/500000] + train/ActionNoiseL2Loss=0.2525 + throughput/total_tokens=72,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=378/500000] + train/ActionNoiseL2Loss=0.1637 + throughput/total_tokens=72,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=379/500000] + train/ActionNoiseL2Loss=0.1996 + throughput/total_tokens=72,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=380/500000] + optim/total_grad_norm=4.164 + train/ActionNoiseL2Loss=0.1426 + throughput/total_tokens=72,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=381/500000] + train/ActionNoiseL2Loss=0.1314 + throughput/total_tokens=73,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=382/500000] + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=73,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=383/500000] + train/ActionNoiseL2Loss=0.3440 + throughput/total_tokens=73,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=384/500000] + train/ActionNoiseL2Loss=0.2311 + throughput/total_tokens=73,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=385/500000] + train/ActionNoiseL2Loss=0.1530 + throughput/total_tokens=73,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=386/500000] + train/ActionNoiseL2Loss=0.2763 + throughput/total_tokens=74,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=387/500000] + train/ActionNoiseL2Loss=0.1570 + throughput/total_tokens=74,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=388/500000] + train/ActionNoiseL2Loss=0.1418 + throughput/total_tokens=74,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=389/500000] + train/ActionNoiseL2Loss=0.1138 + throughput/total_tokens=74,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=390/500000] + train/ActionNoiseL2Loss=0.1271 + throughput/total_tokens=74,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=391/500000] + train/ActionNoiseL2Loss=0.2529 + throughput/total_tokens=75,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=392/500000] + train/ActionNoiseL2Loss=0.1736 + throughput/total_tokens=75,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=393/500000] + train/ActionNoiseL2Loss=0.1746 + throughput/total_tokens=75,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=394/500000] + train/ActionNoiseL2Loss=0.1882 + throughput/total_tokens=75,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=395/500000] + train/ActionNoiseL2Loss=0.2242 + throughput/total_tokens=75,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=396/500000] + train/ActionNoiseL2Loss=0.1332 + throughput/total_tokens=76,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=397/500000] + train/ActionNoiseL2Loss=0.2152 + throughput/total_tokens=76,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=398/500000] + train/ActionNoiseL2Loss=0.1635 + throughput/total_tokens=76,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=399/500000] + train/ActionNoiseL2Loss=0.1624 + throughput/total_tokens=76,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=400/500000] + optim/total_grad_norm=7.385 + train/ActionNoiseL2Loss=0.2042 + throughput/total_tokens=76,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=401/500000] + train/ActionNoiseL2Loss=0.1373 + throughput/total_tokens=76,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=402/500000] + train/ActionNoiseL2Loss=0.1018 + throughput/total_tokens=77,184,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=403/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=77,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=404/500000] + train/ActionNoiseL2Loss=0.1655 + throughput/total_tokens=77,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=405/500000] + train/ActionNoiseL2Loss=0.1159 + throughput/total_tokens=77,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=406/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=77,952,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=407/500000] + train/ActionNoiseL2Loss=0.1526 + throughput/total_tokens=78,144,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=408/500000] + train/ActionNoiseL2Loss=0.1261 + throughput/total_tokens=78,336,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=409/500000] + train/ActionNoiseL2Loss=0.1505 + throughput/total_tokens=78,528,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=410/500000] + train/ActionNoiseL2Loss=0.2511 + throughput/total_tokens=78,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=411/500000] + train/ActionNoiseL2Loss=0.1939 + throughput/total_tokens=78,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=412/500000] + train/ActionNoiseL2Loss=0.2115 + throughput/total_tokens=79,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=413/500000] + train/ActionNoiseL2Loss=0.2044 + throughput/total_tokens=79,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=414/500000] + train/ActionNoiseL2Loss=0.2037 + throughput/total_tokens=79,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=415/500000] + train/ActionNoiseL2Loss=0.1784 + throughput/total_tokens=79,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=416/500000] + train/ActionNoiseL2Loss=0.2150 + throughput/total_tokens=79,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=417/500000] + train/ActionNoiseL2Loss=0.1437 + throughput/total_tokens=80,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=418/500000] + train/ActionNoiseL2Loss=0.1482 + throughput/total_tokens=80,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=419/500000] + train/ActionNoiseL2Loss=0.1928 + throughput/total_tokens=80,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=420/500000] + optim/total_grad_norm=8.263 + train/ActionNoiseL2Loss=0.2725 + throughput/total_tokens=80,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=421/500000] + train/ActionNoiseL2Loss=0.2287 + throughput/total_tokens=80,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=422/500000] + train/ActionNoiseL2Loss=0.1878 + throughput/total_tokens=81,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=423/500000] + train/ActionNoiseL2Loss=0.1858 + throughput/total_tokens=81,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=424/500000] + train/ActionNoiseL2Loss=0.1303 + throughput/total_tokens=81,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=425/500000] + train/ActionNoiseL2Loss=0.1913 + throughput/total_tokens=81,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=426/500000] + train/ActionNoiseL2Loss=0.1467 + throughput/total_tokens=81,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=427/500000] + train/ActionNoiseL2Loss=0.2138 + throughput/total_tokens=81,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=428/500000] + train/ActionNoiseL2Loss=0.1507 + throughput/total_tokens=82,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=429/500000] + train/ActionNoiseL2Loss=0.1733 + throughput/total_tokens=82,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=430/500000] + train/ActionNoiseL2Loss=0.1434 + throughput/total_tokens=82,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=431/500000] + train/ActionNoiseL2Loss=0.1475 + throughput/total_tokens=82,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=432/500000] + train/ActionNoiseL2Loss=0.1511 + throughput/total_tokens=82,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=433/500000] + train/ActionNoiseL2Loss=0.1949 + throughput/total_tokens=83,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=434/500000] + train/ActionNoiseL2Loss=0.1547 + throughput/total_tokens=83,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=435/500000] + train/ActionNoiseL2Loss=0.1464 + throughput/total_tokens=83,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=436/500000] + train/ActionNoiseL2Loss=0.1524 + throughput/total_tokens=83,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=437/500000] + train/ActionNoiseL2Loss=0.1898 + throughput/total_tokens=83,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=438/500000] + train/ActionNoiseL2Loss=0.1673 + throughput/total_tokens=84,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=439/500000] + train/ActionNoiseL2Loss=0.1729 + throughput/total_tokens=84,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=440/500000] + optim/total_grad_norm=3.265 + train/ActionNoiseL2Loss=0.1441 + throughput/total_tokens=84,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=441/500000] + train/ActionNoiseL2Loss=0.1977 + throughput/total_tokens=84,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=442/500000] + train/ActionNoiseL2Loss=0.1632 + throughput/total_tokens=84,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=443/500000] + train/ActionNoiseL2Loss=0.1854 + throughput/total_tokens=85,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=444/500000] + train/ActionNoiseL2Loss=0.1962 + throughput/total_tokens=85,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=445/500000] + train/ActionNoiseL2Loss=0.2512 + throughput/total_tokens=85,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=446/500000] + train/ActionNoiseL2Loss=0.1144 + throughput/total_tokens=85,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=447/500000] + train/ActionNoiseL2Loss=0.2064 + throughput/total_tokens=85,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=448/500000] + train/ActionNoiseL2Loss=0.2244 + throughput/total_tokens=86,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=449/500000] + train/ActionNoiseL2Loss=0.2228 + throughput/total_tokens=86,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=450/500000] + train/ActionNoiseL2Loss=0.1800 + throughput/total_tokens=86,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=451/500000] + train/ActionNoiseL2Loss=0.2390 + throughput/total_tokens=86,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=452/500000] + train/ActionNoiseL2Loss=0.2206 + throughput/total_tokens=86,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=453/500000] + train/ActionNoiseL2Loss=0.2795 + throughput/total_tokens=86,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=454/500000] + train/ActionNoiseL2Loss=0.1973 + throughput/total_tokens=87,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=455/500000] + train/ActionNoiseL2Loss=0.3017 + throughput/total_tokens=87,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=456/500000] + train/ActionNoiseL2Loss=0.2774 + throughput/total_tokens=87,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=457/500000] + train/ActionNoiseL2Loss=0.2321 + throughput/total_tokens=87,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=458/500000] + train/ActionNoiseL2Loss=0.2298 + throughput/total_tokens=87,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=459/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=88,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=460/500000] + optim/total_grad_norm=5.987 + train/ActionNoiseL2Loss=0.1739 + throughput/total_tokens=88,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=461/500000] + train/ActionNoiseL2Loss=0.2274 + throughput/total_tokens=88,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=462/500000] + train/ActionNoiseL2Loss=0.2027 + throughput/total_tokens=88,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=463/500000] + train/ActionNoiseL2Loss=0.1937 + throughput/total_tokens=88,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=464/500000] + train/ActionNoiseL2Loss=0.1859 + throughput/total_tokens=89,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=465/500000] + train/ActionNoiseL2Loss=0.1609 + throughput/total_tokens=89,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=466/500000] + train/ActionNoiseL2Loss=0.1595 + throughput/total_tokens=89,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=467/500000] + train/ActionNoiseL2Loss=0.1508 + throughput/total_tokens=89,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=468/500000] + train/ActionNoiseL2Loss=0.2593 + throughput/total_tokens=89,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=469/500000] + train/ActionNoiseL2Loss=0.1269 + throughput/total_tokens=90,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=470/500000] + train/ActionNoiseL2Loss=0.2105 + throughput/total_tokens=90,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=471/500000] + train/ActionNoiseL2Loss=0.1066 + throughput/total_tokens=90,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=472/500000] + train/ActionNoiseL2Loss=0.1105 + throughput/total_tokens=90,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=473/500000] + train/ActionNoiseL2Loss=0.1957 + throughput/total_tokens=90,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=474/500000] + train/ActionNoiseL2Loss=0.1474 + throughput/total_tokens=91,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=475/500000] + train/ActionNoiseL2Loss=0.1192 + throughput/total_tokens=91,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=476/500000] + train/ActionNoiseL2Loss=0.1914 + throughput/total_tokens=91,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=477/500000] + train/ActionNoiseL2Loss=0.2541 + throughput/total_tokens=91,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=478/500000] + train/ActionNoiseL2Loss=0.1135 + throughput/total_tokens=91,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=479/500000] + train/ActionNoiseL2Loss=0.1993 + throughput/total_tokens=91,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=480/500000] + optim/total_grad_norm=7.383 + train/ActionNoiseL2Loss=0.1830 + throughput/total_tokens=92,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=481/500000] + train/ActionNoiseL2Loss=0.2202 + throughput/total_tokens=92,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=482/500000] + train/ActionNoiseL2Loss=0.1198 + throughput/total_tokens=92,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=483/500000] + train/ActionNoiseL2Loss=0.2074 + throughput/total_tokens=92,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=484/500000] + train/ActionNoiseL2Loss=0.1524 + throughput/total_tokens=92,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=485/500000] + train/ActionNoiseL2Loss=0.2132 + throughput/total_tokens=93,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=486/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=93,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=487/500000] + train/ActionNoiseL2Loss=0.1752 + throughput/total_tokens=93,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=488/500000] + train/ActionNoiseL2Loss=0.1278 + throughput/total_tokens=93,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=489/500000] + train/ActionNoiseL2Loss=0.1890 + throughput/total_tokens=93,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=490/500000] + train/ActionNoiseL2Loss=0.1337 + throughput/total_tokens=94,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=491/500000] + train/ActionNoiseL2Loss=0.1564 + throughput/total_tokens=94,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=492/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=94,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=493/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=94,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=494/500000] + train/ActionNoiseL2Loss=0.1425 + throughput/total_tokens=94,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=495/500000] + train/ActionNoiseL2Loss=0.1775 + throughput/total_tokens=95,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=496/500000] + train/ActionNoiseL2Loss=0.2473 + throughput/total_tokens=95,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=497/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=95,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=498/500000] + train/ActionNoiseL2Loss=0.2051 + throughput/total_tokens=95,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=499/500000] + train/ActionNoiseL2Loss=0.1246 + throughput/total_tokens=95,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=500/500000] + optim/total_grad_norm=10.87 + train/ActionNoiseL2Loss=0.1246 + throughput/total_tokens=96,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/11 [19:35:44] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: warnings.py:109 + FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and + set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc: + https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial: + https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html . + warnings.warn( + + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:860: UserWarning: warnings.py:109 + `_get_pg_default_device` will be deprecated, it only stays for backward-compatiblity reason. If you need to find a device for object + collectives, please use `_get_object_coll_device`. If you need to query the device types supported by group, please use + `_device_capability(group)`. + warnings.warn( + +10/11 [19:35:46] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:722: FutureWarning: warnings.py:109 + Please use DTensor instead and we are deprecating ShardedTensor. + local_shape = tensor.shape + + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:739: FutureWarning: warnings.py:109 + Please use DTensor instead and we are deprecating ShardedTensor. + tensor.shape, + + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:741: FutureWarning: warnings.py:109 + Please use DTensor instead and we are deprecating ShardedTensor. + tensor.dtype, + +10/11 [19:35:50] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/overrides.py:1747: FutureWarning: Please use DTensor warnings.py:109 + instead and we are deprecating ShardedTensor. + result = torch_func_method(public_api, types, args, kwargs) + +10/11 [19:36:22] INFO | >> Saving config... checkpoint.py:608 +10/11 [19:36:48] INFO | >> Saving model state... checkpoint.py:796 +10/11 [19:38:00] INFO | >> Saving optim state... checkpoint.py:811 +10/11 [19:39:29] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=501/500000] + train/ActionNoiseL2Loss=0.1703 + throughput/total_tokens=96,192,000 + throughput/device/tokens_per_second=1,131 + throughput/device/batches_per_second=0.0472 +[step=502/500000] + train/ActionNoiseL2Loss=0.1513 + throughput/total_tokens=96,384,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=503/500000] + train/ActionNoiseL2Loss=0.2198 + throughput/total_tokens=96,576,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=504/500000] + train/ActionNoiseL2Loss=0.2441 + throughput/total_tokens=96,768,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=505/500000] + train/ActionNoiseL2Loss=0.1812 + throughput/total_tokens=96,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=506/500000] + train/ActionNoiseL2Loss=0.2084 + throughput/total_tokens=97,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=507/500000] + train/ActionNoiseL2Loss=0.1542 + throughput/total_tokens=97,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=508/500000] + train/ActionNoiseL2Loss=0.1440 + throughput/total_tokens=97,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=509/500000] + train/ActionNoiseL2Loss=0.2206 + throughput/total_tokens=97,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=510/500000] + train/ActionNoiseL2Loss=0.1816 + throughput/total_tokens=97,920,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=511/500000] + train/ActionNoiseL2Loss=0.1990 + throughput/total_tokens=98,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=512/500000] + train/ActionNoiseL2Loss=0.2182 + throughput/total_tokens=98,304,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=513/500000] + train/ActionNoiseL2Loss=0.1781 + throughput/total_tokens=98,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=514/500000] + train/ActionNoiseL2Loss=0.1553 + throughput/total_tokens=98,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=515/500000] + train/ActionNoiseL2Loss=0.2015 + throughput/total_tokens=98,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=516/500000] + train/ActionNoiseL2Loss=0.1636 + throughput/total_tokens=99,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=517/500000] + train/ActionNoiseL2Loss=0.1387 + throughput/total_tokens=99,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=518/500000] + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=99,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=519/500000] + train/ActionNoiseL2Loss=0.2959 + throughput/total_tokens=99,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=520/500000] + optim/total_grad_norm=6.407 + train/ActionNoiseL2Loss=0.1302 + throughput/total_tokens=99,840,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=521/500000] + train/ActionNoiseL2Loss=0.1554 + throughput/total_tokens=100,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=522/500000] + train/ActionNoiseL2Loss=0.1240 + throughput/total_tokens=100,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=523/500000] + train/ActionNoiseL2Loss=0.1614 + throughput/total_tokens=100,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=524/500000] + train/ActionNoiseL2Loss=0.2435 + throughput/total_tokens=100,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=525/500000] + train/ActionNoiseL2Loss=0.2351 + throughput/total_tokens=100,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=526/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=100,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=527/500000] + train/ActionNoiseL2Loss=0.2120 + throughput/total_tokens=101,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=528/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=101,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=529/500000] + train/ActionNoiseL2Loss=0.1526 + throughput/total_tokens=101,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=530/500000] + train/ActionNoiseL2Loss=0.2704 + throughput/total_tokens=101,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=531/500000] + train/ActionNoiseL2Loss=0.1251 + throughput/total_tokens=101,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=532/500000] + train/ActionNoiseL2Loss=0.2321 + throughput/total_tokens=102,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=533/500000] + train/ActionNoiseL2Loss=0.3532 + throughput/total_tokens=102,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=534/500000] + train/ActionNoiseL2Loss=0.2260 + throughput/total_tokens=102,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=535/500000] + train/ActionNoiseL2Loss=0.1945 + throughput/total_tokens=102,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=536/500000] + train/ActionNoiseL2Loss=0.2155 + throughput/total_tokens=102,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=537/500000] + train/ActionNoiseL2Loss=0.2838 + throughput/total_tokens=103,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=538/500000] + train/ActionNoiseL2Loss=0.2423 + throughput/total_tokens=103,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=539/500000] + train/ActionNoiseL2Loss=0.1487 + throughput/total_tokens=103,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=540/500000] + optim/total_grad_norm=3.650 + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=103,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=541/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=103,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=542/500000] + train/ActionNoiseL2Loss=0.1304 + throughput/total_tokens=104,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=543/500000] + train/ActionNoiseL2Loss=0.1198 + throughput/total_tokens=104,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=544/500000] + train/ActionNoiseL2Loss=0.1425 + throughput/total_tokens=104,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=545/500000] + train/ActionNoiseL2Loss=0.1701 + throughput/total_tokens=104,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=546/500000] + train/ActionNoiseL2Loss=0.1488 + throughput/total_tokens=104,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=547/500000] + train/ActionNoiseL2Loss=0.1018 + throughput/total_tokens=105,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=548/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=105,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=549/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=105,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=550/500000] + train/ActionNoiseL2Loss=0.1880 + throughput/total_tokens=105,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=551/500000] + train/ActionNoiseL2Loss=0.1209 + throughput/total_tokens=105,792,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=552/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=105,984,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=553/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=106,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=554/500000] + train/ActionNoiseL2Loss=0.1918 + throughput/total_tokens=106,368,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=555/500000] + train/ActionNoiseL2Loss=0.1954 + throughput/total_tokens=106,560,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=556/500000] + train/ActionNoiseL2Loss=0.1223 + throughput/total_tokens=106,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=557/500000] + train/ActionNoiseL2Loss=0.1902 + throughput/total_tokens=106,944,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=558/500000] + train/ActionNoiseL2Loss=0.1843 + throughput/total_tokens=107,136,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=559/500000] + train/ActionNoiseL2Loss=0.2216 + throughput/total_tokens=107,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=560/500000] + optim/total_grad_norm=4.657 + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=107,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=561/500000] + train/ActionNoiseL2Loss=0.2161 + throughput/total_tokens=107,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=562/500000] + train/ActionNoiseL2Loss=0.1356 + throughput/total_tokens=107,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=563/500000] + train/ActionNoiseL2Loss=0.1833 + throughput/total_tokens=108,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=564/500000] + train/ActionNoiseL2Loss=0.1330 + throughput/total_tokens=108,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=565/500000] + train/ActionNoiseL2Loss=0.1567 + throughput/total_tokens=108,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=566/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=108,672,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=567/500000] + train/ActionNoiseL2Loss=0.1550 + throughput/total_tokens=108,864,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=568/500000] + train/ActionNoiseL2Loss=0.2928 + throughput/total_tokens=109,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=569/500000] + train/ActionNoiseL2Loss=0.1625 + throughput/total_tokens=109,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=570/500000] + train/ActionNoiseL2Loss=0.1505 + throughput/total_tokens=109,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=571/500000] + train/ActionNoiseL2Loss=0.2306 + throughput/total_tokens=109,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=572/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=109,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=573/500000] + train/ActionNoiseL2Loss=0.1500 + throughput/total_tokens=110,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=574/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=110,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=575/500000] + train/ActionNoiseL2Loss=0.2139 + throughput/total_tokens=110,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=576/500000] + train/ActionNoiseL2Loss=0.1411 + throughput/total_tokens=110,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=577/500000] + train/ActionNoiseL2Loss=0.1230 + throughput/total_tokens=110,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=578/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=110,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=579/500000] + train/ActionNoiseL2Loss=0.2190 + throughput/total_tokens=111,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=580/500000] + optim/total_grad_norm=8.056 + train/ActionNoiseL2Loss=0.2865 + throughput/total_tokens=111,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=581/500000] + train/ActionNoiseL2Loss=0.3435 + throughput/total_tokens=111,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=582/500000] + train/ActionNoiseL2Loss=0.1470 + throughput/total_tokens=111,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=583/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=111,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=584/500000] + train/ActionNoiseL2Loss=0.2123 + throughput/total_tokens=112,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=585/500000] + train/ActionNoiseL2Loss=0.1789 + throughput/total_tokens=112,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=586/500000] + train/ActionNoiseL2Loss=0.1878 + throughput/total_tokens=112,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=587/500000] + train/ActionNoiseL2Loss=0.1520 + throughput/total_tokens=112,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=588/500000] + train/ActionNoiseL2Loss=0.2233 + throughput/total_tokens=112,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=589/500000] + train/ActionNoiseL2Loss=0.3060 + throughput/total_tokens=113,088,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=590/500000] + train/ActionNoiseL2Loss=0.2452 + throughput/total_tokens=113,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=591/500000] + train/ActionNoiseL2Loss=0.1282 + throughput/total_tokens=113,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=592/500000] + train/ActionNoiseL2Loss=0.1563 + throughput/total_tokens=113,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=593/500000] + train/ActionNoiseL2Loss=0.1824 + throughput/total_tokens=113,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=594/500000] + train/ActionNoiseL2Loss=0.2207 + throughput/total_tokens=114,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=595/500000] + train/ActionNoiseL2Loss=0.2320 + throughput/total_tokens=114,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=596/500000] + train/ActionNoiseL2Loss=0.1182 + throughput/total_tokens=114,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=597/500000] + train/ActionNoiseL2Loss=0.2645 + throughput/total_tokens=114,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=598/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=114,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=599/500000] + train/ActionNoiseL2Loss=0.2579 + throughput/total_tokens=115,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=600/500000] + optim/total_grad_norm=3.921 + train/ActionNoiseL2Loss=0.1414 + throughput/total_tokens=115,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=601/500000] + train/ActionNoiseL2Loss=0.2233 + throughput/total_tokens=115,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=602/500000] + train/ActionNoiseL2Loss=0.1843 + throughput/total_tokens=115,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=603/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=115,776,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=604/500000] + train/ActionNoiseL2Loss=0.1976 + throughput/total_tokens=115,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=605/500000] + train/ActionNoiseL2Loss=0.1639 + throughput/total_tokens=116,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=606/500000] + train/ActionNoiseL2Loss=0.1447 + throughput/total_tokens=116,352,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=607/500000] + train/ActionNoiseL2Loss=0.1785 + throughput/total_tokens=116,544,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=608/500000] + train/ActionNoiseL2Loss=0.1555 + throughput/total_tokens=116,736,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=609/500000] + train/ActionNoiseL2Loss=0.2122 + throughput/total_tokens=116,928,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=610/500000] + train/ActionNoiseL2Loss=0.1495 + throughput/total_tokens=117,120,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=611/500000] + train/ActionNoiseL2Loss=0.1678 + throughput/total_tokens=117,312,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=612/500000] + train/ActionNoiseL2Loss=0.1981 + throughput/total_tokens=117,504,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=613/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=117,696,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=614/500000] + train/ActionNoiseL2Loss=0.1343 + throughput/total_tokens=117,888,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=615/500000] + train/ActionNoiseL2Loss=0.1274 + throughput/total_tokens=118,080,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=616/500000] + train/ActionNoiseL2Loss=0.2123 + throughput/total_tokens=118,272,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=617/500000] + train/ActionNoiseL2Loss=0.1338 + throughput/total_tokens=118,464,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=618/500000] + train/ActionNoiseL2Loss=0.1943 + throughput/total_tokens=118,656,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=619/500000] + train/ActionNoiseL2Loss=0.2354 + throughput/total_tokens=118,848,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=620/500000] + optim/total_grad_norm=3.718 + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=119,040,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=621/500000] + train/ActionNoiseL2Loss=0.1532 + throughput/total_tokens=119,232,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=622/500000] + train/ActionNoiseL2Loss=0.2126 + throughput/total_tokens=119,424,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=623/500000] + train/ActionNoiseL2Loss=0.1885 + throughput/total_tokens=119,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=624/500000] + train/ActionNoiseL2Loss=0.1761 + throughput/total_tokens=119,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=625/500000] + train/ActionNoiseL2Loss=0.2028 + throughput/total_tokens=120,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=626/500000] + train/ActionNoiseL2Loss=0.1124 + throughput/total_tokens=120,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=627/500000] + train/ActionNoiseL2Loss=0.1432 + throughput/total_tokens=120,384,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=628/500000] + train/ActionNoiseL2Loss=0.2545 + throughput/total_tokens=120,576,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=629/500000] + train/ActionNoiseL2Loss=0.2390 + throughput/total_tokens=120,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=630/500000] + train/ActionNoiseL2Loss=0.2125 + throughput/total_tokens=120,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=631/500000] + train/ActionNoiseL2Loss=0.1382 + throughput/total_tokens=121,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=632/500000] + train/ActionNoiseL2Loss=0.2573 + throughput/total_tokens=121,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=633/500000] + train/ActionNoiseL2Loss=0.1406 + throughput/total_tokens=121,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=634/500000] + train/ActionNoiseL2Loss=0.1633 + throughput/total_tokens=121,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=635/500000] + train/ActionNoiseL2Loss=0.1632 + throughput/total_tokens=121,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=636/500000] + train/ActionNoiseL2Loss=0.2668 + throughput/total_tokens=122,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=637/500000] + train/ActionNoiseL2Loss=0.1090 + throughput/total_tokens=122,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=638/500000] + train/ActionNoiseL2Loss=0.2536 + throughput/total_tokens=122,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=639/500000] + train/ActionNoiseL2Loss=0.1402 + throughput/total_tokens=122,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=640/500000] + optim/total_grad_norm=4.615 + train/ActionNoiseL2Loss=0.1416 + throughput/total_tokens=122,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=641/500000] + train/ActionNoiseL2Loss=0.2238 + throughput/total_tokens=123,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=642/500000] + train/ActionNoiseL2Loss=0.1920 + throughput/total_tokens=123,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=643/500000] + train/ActionNoiseL2Loss=0.1339 + throughput/total_tokens=123,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=644/500000] + train/ActionNoiseL2Loss=0.1964 + throughput/total_tokens=123,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=645/500000] + train/ActionNoiseL2Loss=0.1669 + throughput/total_tokens=123,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=646/500000] + train/ActionNoiseL2Loss=0.1902 + throughput/total_tokens=124,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=647/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=124,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=648/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=124,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=649/500000] + train/ActionNoiseL2Loss=0.1663 + throughput/total_tokens=124,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=650/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=124,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=651/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=124,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=652/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=125,184,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=653/500000] + train/ActionNoiseL2Loss=0.1196 + throughput/total_tokens=125,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=654/500000] + train/ActionNoiseL2Loss=0.1669 + throughput/total_tokens=125,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=655/500000] + train/ActionNoiseL2Loss=0.1570 + throughput/total_tokens=125,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=656/500000] + train/ActionNoiseL2Loss=0.1188 + throughput/total_tokens=125,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=657/500000] + train/ActionNoiseL2Loss=0.1278 + throughput/total_tokens=126,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=658/500000] + train/ActionNoiseL2Loss=0.1376 + throughput/total_tokens=126,336,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=659/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=126,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=660/500000] + optim/total_grad_norm=6.369 + train/ActionNoiseL2Loss=0.2234 + throughput/total_tokens=126,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=661/500000] + train/ActionNoiseL2Loss=0.2002 + throughput/total_tokens=126,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=662/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=127,104,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=663/500000] + train/ActionNoiseL2Loss=0.1600 + throughput/total_tokens=127,296,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=664/500000] + train/ActionNoiseL2Loss=0.3134 + throughput/total_tokens=127,488,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=665/500000] + train/ActionNoiseL2Loss=0.1834 + throughput/total_tokens=127,680,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=666/500000] + train/ActionNoiseL2Loss=0.1516 + throughput/total_tokens=127,872,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=667/500000] + train/ActionNoiseL2Loss=0.2602 + throughput/total_tokens=128,064,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=668/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=128,256,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=669/500000] + train/ActionNoiseL2Loss=0.1228 + throughput/total_tokens=128,448,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=670/500000] + train/ActionNoiseL2Loss=0.2461 + throughput/total_tokens=128,640,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=671/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=128,832,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=672/500000] + train/ActionNoiseL2Loss=0.1103 + throughput/total_tokens=129,024,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=673/500000] + train/ActionNoiseL2Loss=0.1516 + throughput/total_tokens=129,216,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=674/500000] + train/ActionNoiseL2Loss=0.1350 + throughput/total_tokens=129,408,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=675/500000] + train/ActionNoiseL2Loss=0.1756 + throughput/total_tokens=129,600,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=676/500000] + train/ActionNoiseL2Loss=0.1386 + throughput/total_tokens=129,792,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=677/500000] + train/ActionNoiseL2Loss=0.1383 + throughput/total_tokens=129,984,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=678/500000] + train/ActionNoiseL2Loss=0.1301 + throughput/total_tokens=130,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=679/500000] + train/ActionNoiseL2Loss=0.1765 + throughput/total_tokens=130,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=680/500000] + optim/total_grad_norm=9.441 + train/ActionNoiseL2Loss=0.2595 + throughput/total_tokens=130,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=681/500000] + train/ActionNoiseL2Loss=0.2091 + throughput/total_tokens=130,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=682/500000] + train/ActionNoiseL2Loss=0.1685 + throughput/total_tokens=130,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=683/500000] + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=131,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=684/500000] + train/ActionNoiseL2Loss=0.2247 + throughput/total_tokens=131,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=685/500000] + train/ActionNoiseL2Loss=0.1543 + throughput/total_tokens=131,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=686/500000] + train/ActionNoiseL2Loss=0.1448 + throughput/total_tokens=131,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=687/500000] + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=131,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=688/500000] + train/ActionNoiseL2Loss=0.1761 + throughput/total_tokens=132,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=689/500000] + train/ActionNoiseL2Loss=0.1348 + throughput/total_tokens=132,288,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=690/500000] + train/ActionNoiseL2Loss=0.2134 + throughput/total_tokens=132,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=691/500000] + train/ActionNoiseL2Loss=0.1268 + throughput/total_tokens=132,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=692/500000] + train/ActionNoiseL2Loss=0.1915 + throughput/total_tokens=132,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=693/500000] + train/ActionNoiseL2Loss=0.2120 + throughput/total_tokens=133,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=694/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=133,248,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=695/500000] + train/ActionNoiseL2Loss=0.1064 + throughput/total_tokens=133,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=696/500000] + train/ActionNoiseL2Loss=0.2788 + throughput/total_tokens=133,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=697/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=133,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=698/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=134,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=699/500000] + train/ActionNoiseL2Loss=0.1904 + throughput/total_tokens=134,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=700/500000] + optim/total_grad_norm=5.636 + train/ActionNoiseL2Loss=0.1582 + throughput/total_tokens=134,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=701/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=134,592,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=702/500000] + train/ActionNoiseL2Loss=0.1733 + throughput/total_tokens=134,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=703/500000] + train/ActionNoiseL2Loss=0.1328 + throughput/total_tokens=134,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=704/500000] + train/ActionNoiseL2Loss=0.1399 + throughput/total_tokens=135,168,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=705/500000] + train/ActionNoiseL2Loss=0.1371 + throughput/total_tokens=135,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=706/500000] + train/ActionNoiseL2Loss=0.1263 + throughput/total_tokens=135,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=707/500000] + train/ActionNoiseL2Loss=0.1612 + throughput/total_tokens=135,744,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=708/500000] + train/ActionNoiseL2Loss=0.1757 + throughput/total_tokens=135,936,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=709/500000] + train/ActionNoiseL2Loss=0.1528 + throughput/total_tokens=136,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=710/500000] + train/ActionNoiseL2Loss=0.1618 + throughput/total_tokens=136,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=711/500000] + train/ActionNoiseL2Loss=0.1354 + throughput/total_tokens=136,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=712/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=136,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=713/500000] + train/ActionNoiseL2Loss=0.1743 + throughput/total_tokens=136,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=714/500000] + train/ActionNoiseL2Loss=0.1542 + throughput/total_tokens=137,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=715/500000] + train/ActionNoiseL2Loss=0.1349 + throughput/total_tokens=137,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=716/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=137,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=717/500000] + train/ActionNoiseL2Loss=0.1624 + throughput/total_tokens=137,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=718/500000] + train/ActionNoiseL2Loss=0.1749 + throughput/total_tokens=137,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=719/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=138,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=720/500000] + optim/total_grad_norm=6.383 + train/ActionNoiseL2Loss=0.1838 + throughput/total_tokens=138,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=721/500000] + train/ActionNoiseL2Loss=0.1514 + throughput/total_tokens=138,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=722/500000] + train/ActionNoiseL2Loss=0.1024 + throughput/total_tokens=138,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=723/500000] + train/ActionNoiseL2Loss=0.2342 + throughput/total_tokens=138,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=724/500000] + train/ActionNoiseL2Loss=0.1562 + throughput/total_tokens=139,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=725/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=139,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=726/500000] + train/ActionNoiseL2Loss=0.1318 + throughput/total_tokens=139,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=727/500000] + train/ActionNoiseL2Loss=0.2151 + throughput/total_tokens=139,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=728/500000] + train/ActionNoiseL2Loss=0.1980 + throughput/total_tokens=139,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=729/500000] + train/ActionNoiseL2Loss=0.1526 + throughput/total_tokens=139,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=730/500000] + train/ActionNoiseL2Loss=0.1202 + throughput/total_tokens=140,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=731/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=140,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=732/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=140,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=733/500000] + train/ActionNoiseL2Loss=0.1968 + throughput/total_tokens=140,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=734/500000] + train/ActionNoiseL2Loss=0.1658 + throughput/total_tokens=140,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=735/500000] + train/ActionNoiseL2Loss=0.1119 + throughput/total_tokens=141,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=736/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=141,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=737/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=141,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=738/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=141,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=739/500000] + train/ActionNoiseL2Loss=0.1986 + throughput/total_tokens=141,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=740/500000] + optim/total_grad_norm=4.548 + train/ActionNoiseL2Loss=0.1576 + throughput/total_tokens=142,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=741/500000] + train/ActionNoiseL2Loss=0.1753 + throughput/total_tokens=142,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=742/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=142,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=743/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=142,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=744/500000] + train/ActionNoiseL2Loss=0.1466 + throughput/total_tokens=142,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=745/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=143,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=746/500000] + train/ActionNoiseL2Loss=0.1167 + throughput/total_tokens=143,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=747/500000] + train/ActionNoiseL2Loss=0.1665 + throughput/total_tokens=143,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=748/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=143,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=749/500000] + train/ActionNoiseL2Loss=0.1331 + throughput/total_tokens=143,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=750/500000] + train/ActionNoiseL2Loss=0.1401 + throughput/total_tokens=144,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=751/500000] + train/ActionNoiseL2Loss=0.1687 + throughput/total_tokens=144,192,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=752/500000] + train/ActionNoiseL2Loss=0.1778 + throughput/total_tokens=144,384,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=753/500000] + train/ActionNoiseL2Loss=0.1414 + throughput/total_tokens=144,576,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=754/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=144,768,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=755/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=144,960,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=756/500000] + train/ActionNoiseL2Loss=0.1956 + throughput/total_tokens=145,152,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=757/500000] + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=145,344,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=758/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=145,536,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=759/500000] + train/ActionNoiseL2Loss=0.1328 + throughput/total_tokens=145,728,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=760/500000] + optim/total_grad_norm=6.918 + train/ActionNoiseL2Loss=0.2698 + throughput/total_tokens=145,920,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=761/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=146,112,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=762/500000] + train/ActionNoiseL2Loss=0.2373 + throughput/total_tokens=146,304,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=763/500000] + train/ActionNoiseL2Loss=0.1391 + throughput/total_tokens=146,496,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=764/500000] + train/ActionNoiseL2Loss=0.1548 + throughput/total_tokens=146,688,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=765/500000] + train/ActionNoiseL2Loss=0.1379 + throughput/total_tokens=146,880,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=766/500000] + train/ActionNoiseL2Loss=0.1478 + throughput/total_tokens=147,072,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=767/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=147,264,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=768/500000] + train/ActionNoiseL2Loss=0.1343 + throughput/total_tokens=147,456,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=769/500000] + train/ActionNoiseL2Loss=0.1007 + throughput/total_tokens=147,648,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=770/500000] + train/ActionNoiseL2Loss=0.1797 + throughput/total_tokens=147,840,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=771/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=148,032,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=772/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=148,224,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=773/500000] + train/ActionNoiseL2Loss=0.1454 + throughput/total_tokens=148,416,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=774/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=148,608,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=775/500000] + train/ActionNoiseL2Loss=0.1159 + throughput/total_tokens=148,800,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=776/500000] + train/ActionNoiseL2Loss=0.2240 + throughput/total_tokens=148,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=777/500000] + train/ActionNoiseL2Loss=0.1855 + throughput/total_tokens=149,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=778/500000] + train/ActionNoiseL2Loss=0.2365 + throughput/total_tokens=149,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=779/500000] + train/ActionNoiseL2Loss=0.2190 + throughput/total_tokens=149,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=780/500000] + optim/total_grad_norm=7.733 + train/ActionNoiseL2Loss=0.2293 + throughput/total_tokens=149,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=781/500000] + train/ActionNoiseL2Loss=0.1383 + throughput/total_tokens=149,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=782/500000] + train/ActionNoiseL2Loss=0.2444 + throughput/total_tokens=150,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=783/500000] + train/ActionNoiseL2Loss=0.2187 + throughput/total_tokens=150,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=784/500000] + train/ActionNoiseL2Loss=0.1520 + throughput/total_tokens=150,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=785/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=150,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=786/500000] + train/ActionNoiseL2Loss=0.1105 + throughput/total_tokens=150,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=787/500000] + train/ActionNoiseL2Loss=0.1933 + throughput/total_tokens=151,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=788/500000] + train/ActionNoiseL2Loss=0.1637 + throughput/total_tokens=151,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=789/500000] + train/ActionNoiseL2Loss=0.1945 + throughput/total_tokens=151,488,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=790/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=151,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=791/500000] + train/ActionNoiseL2Loss=0.2110 + throughput/total_tokens=151,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=792/500000] + train/ActionNoiseL2Loss=0.1598 + throughput/total_tokens=152,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=793/500000] + train/ActionNoiseL2Loss=0.1572 + throughput/total_tokens=152,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=794/500000] + train/ActionNoiseL2Loss=0.1884 + throughput/total_tokens=152,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=795/500000] + train/ActionNoiseL2Loss=0.1655 + throughput/total_tokens=152,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=796/500000] + train/ActionNoiseL2Loss=0.2308 + throughput/total_tokens=152,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=797/500000] + train/ActionNoiseL2Loss=0.1365 + throughput/total_tokens=153,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=798/500000] + train/ActionNoiseL2Loss=0.1576 + throughput/total_tokens=153,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=799/500000] + train/ActionNoiseL2Loss=0.1318 + throughput/total_tokens=153,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=800/500000] + optim/total_grad_norm=4.881 + train/ActionNoiseL2Loss=0.1214 + throughput/total_tokens=153,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=801/500000] + train/ActionNoiseL2Loss=0.1525 + throughput/total_tokens=153,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=802/500000] + train/ActionNoiseL2Loss=0.1443 + throughput/total_tokens=153,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=803/500000] + train/ActionNoiseL2Loss=0.1499 + throughput/total_tokens=154,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=804/500000] + train/ActionNoiseL2Loss=0.1189 + throughput/total_tokens=154,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=805/500000] + train/ActionNoiseL2Loss=0.1459 + throughput/total_tokens=154,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=806/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=154,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=807/500000] + train/ActionNoiseL2Loss=0.1314 + throughput/total_tokens=154,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=808/500000] + train/ActionNoiseL2Loss=0.1102 + throughput/total_tokens=155,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=809/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=155,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=810/500000] + train/ActionNoiseL2Loss=0.1141 + throughput/total_tokens=155,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=811/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=155,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=812/500000] + train/ActionNoiseL2Loss=0.2037 + throughput/total_tokens=155,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=813/500000] + train/ActionNoiseL2Loss=0.1696 + throughput/total_tokens=156,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=814/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=156,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=815/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=156,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=816/500000] + train/ActionNoiseL2Loss=0.1774 + throughput/total_tokens=156,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=817/500000] + train/ActionNoiseL2Loss=0.1773 + throughput/total_tokens=156,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=818/500000] + train/ActionNoiseL2Loss=0.1603 + throughput/total_tokens=157,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=819/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=157,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=820/500000] + optim/total_grad_norm=4.206 + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=157,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=821/500000] + train/ActionNoiseL2Loss=0.2081 + throughput/total_tokens=157,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=822/500000] + train/ActionNoiseL2Loss=0.1107 + throughput/total_tokens=157,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=823/500000] + train/ActionNoiseL2Loss=0.1394 + throughput/total_tokens=158,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=824/500000] + train/ActionNoiseL2Loss=0.1607 + throughput/total_tokens=158,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=825/500000] + train/ActionNoiseL2Loss=0.2005 + throughput/total_tokens=158,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=826/500000] + train/ActionNoiseL2Loss=0.1935 + throughput/total_tokens=158,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=827/500000] + train/ActionNoiseL2Loss=0.1837 + throughput/total_tokens=158,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=828/500000] + train/ActionNoiseL2Loss=0.1284 + throughput/total_tokens=158,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=829/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=159,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=830/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=159,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=831/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=159,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=832/500000] + train/ActionNoiseL2Loss=0.1198 + throughput/total_tokens=159,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=833/500000] + train/ActionNoiseL2Loss=0.2139 + throughput/total_tokens=159,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=834/500000] + train/ActionNoiseL2Loss=0.1906 + throughput/total_tokens=160,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=835/500000] + train/ActionNoiseL2Loss=0.1634 + throughput/total_tokens=160,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=836/500000] + train/ActionNoiseL2Loss=0.1281 + throughput/total_tokens=160,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=837/500000] + train/ActionNoiseL2Loss=0.1427 + throughput/total_tokens=160,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=838/500000] + train/ActionNoiseL2Loss=0.1198 + throughput/total_tokens=160,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=839/500000] + train/ActionNoiseL2Loss=0.1485 + throughput/total_tokens=161,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=840/500000] + optim/total_grad_norm=3.456 + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=161,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=841/500000] + train/ActionNoiseL2Loss=0.2200 + throughput/total_tokens=161,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=842/500000] + train/ActionNoiseL2Loss=0.1221 + throughput/total_tokens=161,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=843/500000] + train/ActionNoiseL2Loss=0.1186 + throughput/total_tokens=161,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=844/500000] + train/ActionNoiseL2Loss=0.1306 + throughput/total_tokens=162,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=845/500000] + train/ActionNoiseL2Loss=0.1165 + throughput/total_tokens=162,240,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=846/500000] + train/ActionNoiseL2Loss=0.1400 + throughput/total_tokens=162,432,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=847/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=162,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=848/500000] + train/ActionNoiseL2Loss=0.1417 + throughput/total_tokens=162,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=849/500000] + train/ActionNoiseL2Loss=0.1859 + throughput/total_tokens=163,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=850/500000] + train/ActionNoiseL2Loss=0.1387 + throughput/total_tokens=163,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=851/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=163,392,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=852/500000] + train/ActionNoiseL2Loss=0.1677 + throughput/total_tokens=163,584,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=853/500000] + train/ActionNoiseL2Loss=0.1268 + throughput/total_tokens=163,776,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=854/500000] + train/ActionNoiseL2Loss=0.1420 + throughput/total_tokens=163,968,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=855/500000] + train/ActionNoiseL2Loss=0.2263 + throughput/total_tokens=164,160,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=856/500000] + train/ActionNoiseL2Loss=0.1452 + throughput/total_tokens=164,352,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=857/500000] + train/ActionNoiseL2Loss=0.1151 + throughput/total_tokens=164,544,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=858/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=164,736,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=859/500000] + train/ActionNoiseL2Loss=0.3148 + throughput/total_tokens=164,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=860/500000] + optim/total_grad_norm=5.956 + train/ActionNoiseL2Loss=0.2201 + throughput/total_tokens=165,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=861/500000] + train/ActionNoiseL2Loss=0.1913 + throughput/total_tokens=165,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=862/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=165,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=863/500000] + train/ActionNoiseL2Loss=0.2075 + throughput/total_tokens=165,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=864/500000] + train/ActionNoiseL2Loss=0.1981 + throughput/total_tokens=165,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=865/500000] + train/ActionNoiseL2Loss=0.1725 + throughput/total_tokens=166,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=866/500000] + train/ActionNoiseL2Loss=0.3409 + throughput/total_tokens=166,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=867/500000] + train/ActionNoiseL2Loss=0.1746 + throughput/total_tokens=166,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=868/500000] + train/ActionNoiseL2Loss=0.1256 + throughput/total_tokens=166,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=869/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=166,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=870/500000] + train/ActionNoiseL2Loss=0.1590 + throughput/total_tokens=167,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=871/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=167,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=872/500000] + train/ActionNoiseL2Loss=0.2058 + throughput/total_tokens=167,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=873/500000] + train/ActionNoiseL2Loss=0.1099 + throughput/total_tokens=167,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=874/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=167,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=875/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=168,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=876/500000] + train/ActionNoiseL2Loss=0.1209 + throughput/total_tokens=168,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=877/500000] + train/ActionNoiseL2Loss=0.1574 + throughput/total_tokens=168,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=878/500000] + train/ActionNoiseL2Loss=0.1856 + throughput/total_tokens=168,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=879/500000] + train/ActionNoiseL2Loss=0.1358 + throughput/total_tokens=168,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=880/500000] + optim/total_grad_norm=3.996 + train/ActionNoiseL2Loss=0.1317 + throughput/total_tokens=168,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=881/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=169,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=882/500000] + train/ActionNoiseL2Loss=0.1975 + throughput/total_tokens=169,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=883/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=169,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=884/500000] + train/ActionNoiseL2Loss=0.1211 + throughput/total_tokens=169,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=885/500000] + train/ActionNoiseL2Loss=0.1022 + throughput/total_tokens=169,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=886/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=170,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=887/500000] + train/ActionNoiseL2Loss=0.1509 + throughput/total_tokens=170,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=888/500000] + train/ActionNoiseL2Loss=0.2164 + throughput/total_tokens=170,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=889/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=170,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=890/500000] + train/ActionNoiseL2Loss=0.1346 + throughput/total_tokens=170,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=891/500000] + train/ActionNoiseL2Loss=0.1811 + throughput/total_tokens=171,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=892/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=171,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=893/500000] + train/ActionNoiseL2Loss=0.1193 + throughput/total_tokens=171,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=894/500000] + train/ActionNoiseL2Loss=0.1188 + throughput/total_tokens=171,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=895/500000] + train/ActionNoiseL2Loss=0.1811 + throughput/total_tokens=171,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=896/500000] + train/ActionNoiseL2Loss=0.1507 + throughput/total_tokens=172,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=897/500000] + train/ActionNoiseL2Loss=0.1480 + throughput/total_tokens=172,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=898/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=172,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=899/500000] + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=172,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=900/500000] + optim/total_grad_norm=2.402 + train/ActionNoiseL2Loss=0.0972 + throughput/total_tokens=172,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=901/500000] + train/ActionNoiseL2Loss=0.1059 + throughput/total_tokens=172,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=902/500000] + train/ActionNoiseL2Loss=0.1459 + throughput/total_tokens=173,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=903/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=173,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=904/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=173,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=905/500000] + train/ActionNoiseL2Loss=0.1192 + throughput/total_tokens=173,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=906/500000] + train/ActionNoiseL2Loss=0.1601 + throughput/total_tokens=173,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=907/500000] + train/ActionNoiseL2Loss=0.1231 + throughput/total_tokens=174,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=908/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=174,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=909/500000] + train/ActionNoiseL2Loss=0.1356 + throughput/total_tokens=174,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=910/500000] + train/ActionNoiseL2Loss=0.1022 + throughput/total_tokens=174,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=911/500000] + train/ActionNoiseL2Loss=0.1394 + throughput/total_tokens=174,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=912/500000] + train/ActionNoiseL2Loss=0.1333 + throughput/total_tokens=175,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=913/500000] + train/ActionNoiseL2Loss=0.1293 + throughput/total_tokens=175,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=914/500000] + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=175,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=915/500000] + train/ActionNoiseL2Loss=0.1581 + throughput/total_tokens=175,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=916/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=175,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=917/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=176,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=918/500000] + train/ActionNoiseL2Loss=0.1130 + throughput/total_tokens=176,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=919/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=176,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=920/500000] + optim/total_grad_norm=4.727 + train/ActionNoiseL2Loss=0.1679 + throughput/total_tokens=176,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=921/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=176,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=922/500000] + train/ActionNoiseL2Loss=0.1623 + throughput/total_tokens=177,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=923/500000] + train/ActionNoiseL2Loss=0.1767 + throughput/total_tokens=177,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=924/500000] + train/ActionNoiseL2Loss=0.1155 + throughput/total_tokens=177,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=925/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=177,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=926/500000] + train/ActionNoiseL2Loss=0.1612 + throughput/total_tokens=177,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=927/500000] + train/ActionNoiseL2Loss=0.1413 + throughput/total_tokens=177,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=928/500000] + train/ActionNoiseL2Loss=0.1217 + throughput/total_tokens=178,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=929/500000] + train/ActionNoiseL2Loss=0.1660 + throughput/total_tokens=178,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=930/500000] + train/ActionNoiseL2Loss=0.1755 + throughput/total_tokens=178,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=931/500000] + train/ActionNoiseL2Loss=0.2330 + throughput/total_tokens=178,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=932/500000] + train/ActionNoiseL2Loss=0.1350 + throughput/total_tokens=178,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=933/500000] + train/ActionNoiseL2Loss=0.2132 + throughput/total_tokens=179,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=934/500000] + train/ActionNoiseL2Loss=0.1693 + throughput/total_tokens=179,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=935/500000] + train/ActionNoiseL2Loss=0.1488 + throughput/total_tokens=179,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=936/500000] + train/ActionNoiseL2Loss=0.1275 + throughput/total_tokens=179,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=937/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=179,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=938/500000] + train/ActionNoiseL2Loss=0.1058 + throughput/total_tokens=180,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=939/500000] + train/ActionNoiseL2Loss=0.1220 + throughput/total_tokens=180,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=940/500000] + optim/total_grad_norm=3.538 + train/ActionNoiseL2Loss=0.1462 + throughput/total_tokens=180,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=941/500000] + train/ActionNoiseL2Loss=0.1248 + throughput/total_tokens=180,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=942/500000] + train/ActionNoiseL2Loss=0.2339 + throughput/total_tokens=180,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=943/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=181,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=944/500000] + train/ActionNoiseL2Loss=0.1528 + throughput/total_tokens=181,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=945/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=181,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=946/500000] + train/ActionNoiseL2Loss=0.1499 + throughput/total_tokens=181,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=947/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=181,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=948/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=182,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=949/500000] + train/ActionNoiseL2Loss=0.1143 + throughput/total_tokens=182,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=950/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=182,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=951/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=182,592,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=952/500000] + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=182,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=953/500000] + train/ActionNoiseL2Loss=0.1123 + throughput/total_tokens=182,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=954/500000] + train/ActionNoiseL2Loss=0.1786 + throughput/total_tokens=183,168,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=955/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=183,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=956/500000] + train/ActionNoiseL2Loss=0.2818 + throughput/total_tokens=183,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=957/500000] + train/ActionNoiseL2Loss=0.1753 + throughput/total_tokens=183,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=958/500000] + train/ActionNoiseL2Loss=0.2083 + throughput/total_tokens=183,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=959/500000] + train/ActionNoiseL2Loss=0.1064 + throughput/total_tokens=184,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=960/500000] + optim/total_grad_norm=5.005 + train/ActionNoiseL2Loss=0.1364 + throughput/total_tokens=184,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=961/500000] + train/ActionNoiseL2Loss=0.1365 + throughput/total_tokens=184,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=962/500000] + train/ActionNoiseL2Loss=0.1343 + throughput/total_tokens=184,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=963/500000] + train/ActionNoiseL2Loss=0.1379 + throughput/total_tokens=184,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=964/500000] + train/ActionNoiseL2Loss=0.1226 + throughput/total_tokens=185,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=965/500000] + train/ActionNoiseL2Loss=0.1860 + throughput/total_tokens=185,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=966/500000] + train/ActionNoiseL2Loss=0.1256 + throughput/total_tokens=185,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=967/500000] + train/ActionNoiseL2Loss=0.1707 + throughput/total_tokens=185,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=968/500000] + train/ActionNoiseL2Loss=0.1766 + throughput/total_tokens=185,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=969/500000] + train/ActionNoiseL2Loss=0.1599 + throughput/total_tokens=186,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=970/500000] + train/ActionNoiseL2Loss=0.2115 + throughput/total_tokens=186,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=971/500000] + train/ActionNoiseL2Loss=0.1383 + throughput/total_tokens=186,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=972/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=186,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=973/500000] + train/ActionNoiseL2Loss=0.1198 + throughput/total_tokens=186,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=974/500000] + train/ActionNoiseL2Loss=0.1799 + throughput/total_tokens=187,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=975/500000] + train/ActionNoiseL2Loss=0.1841 + throughput/total_tokens=187,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=976/500000] + train/ActionNoiseL2Loss=0.1656 + throughput/total_tokens=187,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=977/500000] + train/ActionNoiseL2Loss=0.1379 + throughput/total_tokens=187,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=978/500000] + train/ActionNoiseL2Loss=0.2002 + throughput/total_tokens=187,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=979/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=187,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=980/500000] + optim/total_grad_norm=3.278 + train/ActionNoiseL2Loss=0.1251 + throughput/total_tokens=188,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=981/500000] + train/ActionNoiseL2Loss=0.1840 + throughput/total_tokens=188,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=982/500000] + train/ActionNoiseL2Loss=0.1260 + throughput/total_tokens=188,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=983/500000] + train/ActionNoiseL2Loss=0.1267 + throughput/total_tokens=188,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=984/500000] + train/ActionNoiseL2Loss=0.1250 + throughput/total_tokens=188,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=985/500000] + train/ActionNoiseL2Loss=0.1167 + throughput/total_tokens=189,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=986/500000] + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=189,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=987/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=189,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=988/500000] + train/ActionNoiseL2Loss=0.1755 + throughput/total_tokens=189,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=989/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=189,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=990/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=190,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=991/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=190,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=992/500000] + train/ActionNoiseL2Loss=0.1105 + throughput/total_tokens=190,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=993/500000] + train/ActionNoiseL2Loss=0.1633 + throughput/total_tokens=190,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=994/500000] + train/ActionNoiseL2Loss=0.2019 + throughput/total_tokens=190,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=995/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=191,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=996/500000] + train/ActionNoiseL2Loss=0.2068 + throughput/total_tokens=191,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=997/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=191,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=998/500000] + train/ActionNoiseL2Loss=0.1515 + throughput/total_tokens=191,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=999/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=191,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1000/500000] + optim/total_grad_norm=4.345 + train/ActionNoiseL2Loss=0.1499 + throughput/total_tokens=192,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/11 [22:35:03] INFO | >> Saving config... checkpoint.py:608 +10/11 [22:35:47] INFO | >> Saving model state... checkpoint.py:796 +10/11 [22:37:01] INFO | >> Saving optim state... checkpoint.py:811 +10/11 [22:38:32] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=1001/500000] + train/ActionNoiseL2Loss=0.2167 + throughput/total_tokens=192,192,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=1002/500000] + train/ActionNoiseL2Loss=0.1557 + throughput/total_tokens=192,384,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=1003/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=192,576,000 + throughput/device/tokens_per_second=1,102 + throughput/device/batches_per_second=0.0460 +[step=1004/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=192,768,000 + throughput/device/tokens_per_second=1,109 + throughput/device/batches_per_second=0.0462 +[step=1005/500000] + train/ActionNoiseL2Loss=0.1221 + throughput/total_tokens=192,960,000 + throughput/device/tokens_per_second=1,117 + throughput/device/batches_per_second=0.0466 +[step=1006/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=193,152,000 + throughput/device/tokens_per_second=1,122 + throughput/device/batches_per_second=0.0468 +[step=1007/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=193,344,000 + throughput/device/tokens_per_second=1,125 + throughput/device/batches_per_second=0.0469 +[step=1008/500000] + train/ActionNoiseL2Loss=0.1425 + throughput/total_tokens=193,536,000 + throughput/device/tokens_per_second=1,128 + throughput/device/batches_per_second=0.0470 +[step=1009/500000] + train/ActionNoiseL2Loss=0.1531 + throughput/total_tokens=193,728,000 + throughput/device/tokens_per_second=1,131 + throughput/device/batches_per_second=0.0471 +[step=1010/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=193,920,000 + throughput/device/tokens_per_second=1,132 + throughput/device/batches_per_second=0.0472 + System/Peak GPU Memory (MB)=51,076 +[step=1011/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=194,112,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=1012/500000] + train/ActionNoiseL2Loss=0.1824 + throughput/total_tokens=194,304,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=1013/500000] + train/ActionNoiseL2Loss=0.1228 + throughput/total_tokens=194,496,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=1014/500000] + train/ActionNoiseL2Loss=0.1620 + throughput/total_tokens=194,688,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=1015/500000] + train/ActionNoiseL2Loss=0.1710 + throughput/total_tokens=194,880,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=1016/500000] + train/ActionNoiseL2Loss=0.1462 + throughput/total_tokens=195,072,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=1017/500000] + train/ActionNoiseL2Loss=0.2017 + throughput/total_tokens=195,264,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1018/500000] + train/ActionNoiseL2Loss=0.1372 + throughput/total_tokens=195,456,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1019/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=195,648,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=1020/500000] + optim/total_grad_norm=5.606 + train/ActionNoiseL2Loss=0.1552 + throughput/total_tokens=195,840,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 + System/Peak GPU Memory (MB)=51,076 +[step=1021/500000] + train/ActionNoiseL2Loss=0.1568 + throughput/total_tokens=196,032,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=1022/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=196,224,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=1023/500000] + train/ActionNoiseL2Loss=0.1115 + throughput/total_tokens=196,416,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1024/500000] + train/ActionNoiseL2Loss=0.1085 + throughput/total_tokens=196,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1025/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=196,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1026/500000] + train/ActionNoiseL2Loss=0.1260 + throughput/total_tokens=196,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1027/500000] + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=197,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1028/500000] + train/ActionNoiseL2Loss=0.1797 + throughput/total_tokens=197,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1029/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=197,568,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1030/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=197,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1031/500000] + train/ActionNoiseL2Loss=0.1258 + throughput/total_tokens=197,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1032/500000] + train/ActionNoiseL2Loss=0.1568 + throughput/total_tokens=198,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1033/500000] + train/ActionNoiseL2Loss=0.1533 + throughput/total_tokens=198,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1034/500000] + train/ActionNoiseL2Loss=0.1341 + throughput/total_tokens=198,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1035/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=198,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1036/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=198,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1037/500000] + train/ActionNoiseL2Loss=0.1450 + throughput/total_tokens=199,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1038/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=199,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1039/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=199,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1040/500000] + optim/total_grad_norm=4.902 + train/ActionNoiseL2Loss=0.1560 + throughput/total_tokens=199,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1041/500000] + train/ActionNoiseL2Loss=0.1703 + throughput/total_tokens=199,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1042/500000] + train/ActionNoiseL2Loss=0.1258 + throughput/total_tokens=200,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1043/500000] + train/ActionNoiseL2Loss=0.1457 + throughput/total_tokens=200,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1044/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=200,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1045/500000] + train/ActionNoiseL2Loss=0.1294 + throughput/total_tokens=200,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1046/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=200,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1047/500000] + train/ActionNoiseL2Loss=0.1665 + throughput/total_tokens=201,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1048/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=201,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1049/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=201,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1050/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=201,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1051/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=201,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1052/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=201,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1053/500000] + train/ActionNoiseL2Loss=0.0968 + throughput/total_tokens=202,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1054/500000] + train/ActionNoiseL2Loss=0.1421 + throughput/total_tokens=202,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1055/500000] + train/ActionNoiseL2Loss=0.1199 + throughput/total_tokens=202,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1056/500000] + train/ActionNoiseL2Loss=0.1864 + throughput/total_tokens=202,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1057/500000] + train/ActionNoiseL2Loss=0.1240 + throughput/total_tokens=202,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1058/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=203,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1059/500000] + train/ActionNoiseL2Loss=0.1790 + throughput/total_tokens=203,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1060/500000] + optim/total_grad_norm=3.847 + train/ActionNoiseL2Loss=0.1497 + throughput/total_tokens=203,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1061/500000] + train/ActionNoiseL2Loss=0.1122 + throughput/total_tokens=203,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1062/500000] + train/ActionNoiseL2Loss=0.2019 + throughput/total_tokens=203,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1063/500000] + train/ActionNoiseL2Loss=0.1632 + throughput/total_tokens=204,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1064/500000] + train/ActionNoiseL2Loss=0.1350 + throughput/total_tokens=204,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1065/500000] + train/ActionNoiseL2Loss=0.1341 + throughput/total_tokens=204,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1066/500000] + train/ActionNoiseL2Loss=0.1294 + throughput/total_tokens=204,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1067/500000] + train/ActionNoiseL2Loss=0.2637 + throughput/total_tokens=204,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1068/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=205,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1069/500000] + train/ActionNoiseL2Loss=0.2197 + throughput/total_tokens=205,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1070/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=205,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=1071/500000] + train/ActionNoiseL2Loss=0.1195 + throughput/total_tokens=205,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1072/500000] + train/ActionNoiseL2Loss=0.1177 + throughput/total_tokens=205,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1073/500000] + train/ActionNoiseL2Loss=0.1170 + throughput/total_tokens=206,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1074/500000] + train/ActionNoiseL2Loss=0.1434 + throughput/total_tokens=206,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1075/500000] + train/ActionNoiseL2Loss=0.1313 + throughput/total_tokens=206,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1076/500000] + train/ActionNoiseL2Loss=0.1373 + throughput/total_tokens=206,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1077/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=206,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1078/500000] + train/ActionNoiseL2Loss=0.1142 + throughput/total_tokens=206,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1079/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=207,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1080/500000] + optim/total_grad_norm=3.521 + train/ActionNoiseL2Loss=0.1762 + throughput/total_tokens=207,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1081/500000] + train/ActionNoiseL2Loss=0.1171 + throughput/total_tokens=207,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1082/500000] + train/ActionNoiseL2Loss=0.1689 + throughput/total_tokens=207,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1083/500000] + train/ActionNoiseL2Loss=0.1741 + throughput/total_tokens=207,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1084/500000] + train/ActionNoiseL2Loss=0.1731 + throughput/total_tokens=208,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1085/500000] + train/ActionNoiseL2Loss=0.1242 + throughput/total_tokens=208,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1086/500000] + train/ActionNoiseL2Loss=0.1431 + throughput/total_tokens=208,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1087/500000] + train/ActionNoiseL2Loss=0.1299 + throughput/total_tokens=208,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1088/500000] + train/ActionNoiseL2Loss=0.1166 + throughput/total_tokens=208,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1089/500000] + train/ActionNoiseL2Loss=0.1452 + throughput/total_tokens=209,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1090/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=209,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1091/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=209,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1092/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=209,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1093/500000] + train/ActionNoiseL2Loss=0.1653 + throughput/total_tokens=209,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1094/500000] + train/ActionNoiseL2Loss=0.1503 + throughput/total_tokens=210,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1095/500000] + train/ActionNoiseL2Loss=0.1765 + throughput/total_tokens=210,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1096/500000] + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=210,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1097/500000] + train/ActionNoiseL2Loss=0.1504 + throughput/total_tokens=210,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1098/500000] + train/ActionNoiseL2Loss=0.1196 + throughput/total_tokens=210,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1099/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=211,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1100/500000] + optim/total_grad_norm=1.843 + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=211,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1101/500000] + train/ActionNoiseL2Loss=0.1323 + throughput/total_tokens=211,392,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1102/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=211,584,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1103/500000] + train/ActionNoiseL2Loss=0.1441 + throughput/total_tokens=211,776,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1104/500000] + train/ActionNoiseL2Loss=0.1306 + throughput/total_tokens=211,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1105/500000] + train/ActionNoiseL2Loss=0.1146 + throughput/total_tokens=212,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1106/500000] + train/ActionNoiseL2Loss=0.2467 + throughput/total_tokens=212,352,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1107/500000] + train/ActionNoiseL2Loss=0.1611 + throughput/total_tokens=212,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1108/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=212,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1109/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=212,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1110/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=213,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1111/500000] + train/ActionNoiseL2Loss=0.1553 + throughput/total_tokens=213,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1112/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=213,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1113/500000] + train/ActionNoiseL2Loss=0.1215 + throughput/total_tokens=213,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1114/500000] + train/ActionNoiseL2Loss=0.1409 + throughput/total_tokens=213,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1115/500000] + train/ActionNoiseL2Loss=0.1652 + throughput/total_tokens=214,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1116/500000] + train/ActionNoiseL2Loss=0.1950 + throughput/total_tokens=214,272,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1117/500000] + train/ActionNoiseL2Loss=0.1361 + throughput/total_tokens=214,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1118/500000] + train/ActionNoiseL2Loss=0.1683 + throughput/total_tokens=214,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1119/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=214,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1120/500000] + optim/total_grad_norm=3.143 + train/ActionNoiseL2Loss=0.1246 + throughput/total_tokens=215,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1121/500000] + train/ActionNoiseL2Loss=0.1066 + throughput/total_tokens=215,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1122/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=215,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1123/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=215,616,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1124/500000] + train/ActionNoiseL2Loss=0.1740 + throughput/total_tokens=215,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1125/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=216,000,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1126/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=216,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1127/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=216,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1128/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=216,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1129/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=216,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1130/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=216,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1131/500000] + train/ActionNoiseL2Loss=0.1823 + throughput/total_tokens=217,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1132/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=217,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1133/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=217,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1134/500000] + train/ActionNoiseL2Loss=0.1175 + throughput/total_tokens=217,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1135/500000] + train/ActionNoiseL2Loss=0.1160 + throughput/total_tokens=217,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1136/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=218,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1137/500000] + train/ActionNoiseL2Loss=0.1154 + throughput/total_tokens=218,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1138/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=218,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1139/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=218,688,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1140/500000] + optim/total_grad_norm=7.206 + train/ActionNoiseL2Loss=0.1999 + throughput/total_tokens=218,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1141/500000] + train/ActionNoiseL2Loss=0.2679 + throughput/total_tokens=219,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1142/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=219,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1143/500000] + train/ActionNoiseL2Loss=0.1665 + throughput/total_tokens=219,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1144/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=219,648,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1145/500000] + train/ActionNoiseL2Loss=0.2206 + throughput/total_tokens=219,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1146/500000] + train/ActionNoiseL2Loss=0.2013 + throughput/total_tokens=220,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1147/500000] + train/ActionNoiseL2Loss=0.1957 + throughput/total_tokens=220,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1148/500000] + train/ActionNoiseL2Loss=0.1741 + throughput/total_tokens=220,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1149/500000] + train/ActionNoiseL2Loss=0.1738 + throughput/total_tokens=220,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1150/500000] + train/ActionNoiseL2Loss=0.1142 + throughput/total_tokens=220,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1151/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=220,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1152/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=221,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1153/500000] + train/ActionNoiseL2Loss=0.1690 + throughput/total_tokens=221,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1154/500000] + train/ActionNoiseL2Loss=0.1215 + throughput/total_tokens=221,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1155/500000] + train/ActionNoiseL2Loss=0.1591 + throughput/total_tokens=221,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1156/500000] + train/ActionNoiseL2Loss=0.2533 + throughput/total_tokens=221,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1157/500000] + train/ActionNoiseL2Loss=0.2097 + throughput/total_tokens=222,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1158/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=222,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1159/500000] + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=222,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1160/500000] + optim/total_grad_norm=2.133 + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=222,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1161/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=222,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1162/500000] + train/ActionNoiseL2Loss=0.1857 + throughput/total_tokens=223,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1163/500000] + train/ActionNoiseL2Loss=0.1259 + throughput/total_tokens=223,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1164/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=223,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1165/500000] + train/ActionNoiseL2Loss=0.1447 + throughput/total_tokens=223,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1166/500000] + train/ActionNoiseL2Loss=0.1533 + throughput/total_tokens=223,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1167/500000] + train/ActionNoiseL2Loss=0.2602 + throughput/total_tokens=224,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1168/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=224,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1169/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=224,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1170/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=224,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1171/500000] + train/ActionNoiseL2Loss=0.3256 + throughput/total_tokens=224,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1172/500000] + train/ActionNoiseL2Loss=0.1480 + throughput/total_tokens=225,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1173/500000] + train/ActionNoiseL2Loss=0.1742 + throughput/total_tokens=225,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1174/500000] + train/ActionNoiseL2Loss=0.2192 + throughput/total_tokens=225,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1175/500000] + train/ActionNoiseL2Loss=0.1397 + throughput/total_tokens=225,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1176/500000] + train/ActionNoiseL2Loss=0.1477 + throughput/total_tokens=225,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1177/500000] + train/ActionNoiseL2Loss=0.1277 + throughput/total_tokens=225,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1178/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=226,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1179/500000] + train/ActionNoiseL2Loss=0.1485 + throughput/total_tokens=226,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1180/500000] + optim/total_grad_norm=3.099 + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=226,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1181/500000] + train/ActionNoiseL2Loss=0.1383 + throughput/total_tokens=226,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1182/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=226,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1183/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=227,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1184/500000] + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=227,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1185/500000] + train/ActionNoiseL2Loss=0.1306 + throughput/total_tokens=227,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1186/500000] + train/ActionNoiseL2Loss=0.2036 + throughput/total_tokens=227,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1187/500000] + train/ActionNoiseL2Loss=0.1710 + throughput/total_tokens=227,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1188/500000] + train/ActionNoiseL2Loss=0.1976 + throughput/total_tokens=228,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1189/500000] + train/ActionNoiseL2Loss=0.1615 + throughput/total_tokens=228,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1190/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=228,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1191/500000] + train/ActionNoiseL2Loss=0.1432 + throughput/total_tokens=228,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1192/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=228,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1193/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=229,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1194/500000] + train/ActionNoiseL2Loss=0.1307 + throughput/total_tokens=229,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1195/500000] + train/ActionNoiseL2Loss=0.1012 + throughput/total_tokens=229,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1196/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=229,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1197/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=229,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1198/500000] + train/ActionNoiseL2Loss=0.1302 + throughput/total_tokens=230,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1199/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=230,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1200/500000] + optim/total_grad_norm=2.694 + train/ActionNoiseL2Loss=0.1366 + throughput/total_tokens=230,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=1201/500000] + train/ActionNoiseL2Loss=0.1442 + throughput/total_tokens=230,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1202/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=230,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1203/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=230,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1204/500000] + train/ActionNoiseL2Loss=0.1575 + throughput/total_tokens=231,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1205/500000] + train/ActionNoiseL2Loss=0.1154 + throughput/total_tokens=231,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1206/500000] + train/ActionNoiseL2Loss=0.1512 + throughput/total_tokens=231,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1207/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=231,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1208/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=231,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1209/500000] + train/ActionNoiseL2Loss=0.1366 + throughput/total_tokens=232,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1210/500000] + train/ActionNoiseL2Loss=0.1513 + throughput/total_tokens=232,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1211/500000] + train/ActionNoiseL2Loss=0.1910 + throughput/total_tokens=232,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1212/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=232,704,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1213/500000] + train/ActionNoiseL2Loss=0.1918 + throughput/total_tokens=232,896,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1214/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=233,088,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1215/500000] + train/ActionNoiseL2Loss=0.1797 + throughput/total_tokens=233,280,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1216/500000] + train/ActionNoiseL2Loss=0.1816 + throughput/total_tokens=233,472,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1217/500000] + train/ActionNoiseL2Loss=0.1090 + throughput/total_tokens=233,664,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1218/500000] + train/ActionNoiseL2Loss=0.1587 + throughput/total_tokens=233,856,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1219/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=234,048,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1220/500000] + optim/total_grad_norm=1.748 + train/ActionNoiseL2Loss=0.1212 + throughput/total_tokens=234,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1221/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=234,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1222/500000] + train/ActionNoiseL2Loss=0.2019 + throughput/total_tokens=234,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1223/500000] + train/ActionNoiseL2Loss=0.1384 + throughput/total_tokens=234,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1224/500000] + train/ActionNoiseL2Loss=0.1215 + throughput/total_tokens=235,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1225/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=235,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1226/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=235,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1227/500000] + train/ActionNoiseL2Loss=0.1598 + throughput/total_tokens=235,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1228/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=235,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1229/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=235,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1230/500000] + train/ActionNoiseL2Loss=0.1018 + throughput/total_tokens=236,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1231/500000] + train/ActionNoiseL2Loss=0.1508 + throughput/total_tokens=236,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1232/500000] + train/ActionNoiseL2Loss=0.1555 + throughput/total_tokens=236,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1233/500000] + train/ActionNoiseL2Loss=0.1531 + throughput/total_tokens=236,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1234/500000] + train/ActionNoiseL2Loss=0.1863 + throughput/total_tokens=236,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1235/500000] + train/ActionNoiseL2Loss=0.1334 + throughput/total_tokens=237,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1236/500000] + train/ActionNoiseL2Loss=0.2222 + throughput/total_tokens=237,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1237/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=237,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1238/500000] + train/ActionNoiseL2Loss=0.1184 + throughput/total_tokens=237,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1239/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=237,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1240/500000] + optim/total_grad_norm=3.251 + train/ActionNoiseL2Loss=0.1418 + throughput/total_tokens=238,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1241/500000] + train/ActionNoiseL2Loss=0.1230 + throughput/total_tokens=238,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1242/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=238,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1243/500000] + train/ActionNoiseL2Loss=0.1705 + throughput/total_tokens=238,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1244/500000] + train/ActionNoiseL2Loss=0.1671 + throughput/total_tokens=238,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1245/500000] + train/ActionNoiseL2Loss=0.1361 + throughput/total_tokens=239,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1246/500000] + train/ActionNoiseL2Loss=0.1601 + throughput/total_tokens=239,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1247/500000] + train/ActionNoiseL2Loss=0.1294 + throughput/total_tokens=239,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1248/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=239,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1249/500000] + train/ActionNoiseL2Loss=0.1366 + throughput/total_tokens=239,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1250/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=240,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1251/500000] + train/ActionNoiseL2Loss=0.1701 + throughput/total_tokens=240,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1252/500000] + train/ActionNoiseL2Loss=0.1229 + throughput/total_tokens=240,384,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1253/500000] + train/ActionNoiseL2Loss=0.1296 + throughput/total_tokens=240,576,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1254/500000] + train/ActionNoiseL2Loss=0.1363 + throughput/total_tokens=240,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1255/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=240,960,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1256/500000] + train/ActionNoiseL2Loss=0.1407 + throughput/total_tokens=241,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1257/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=241,344,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1258/500000] + train/ActionNoiseL2Loss=0.1186 + throughput/total_tokens=241,536,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1259/500000] + train/ActionNoiseL2Loss=0.1474 + throughput/total_tokens=241,728,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1260/500000] + optim/total_grad_norm=3.474 + train/ActionNoiseL2Loss=0.1184 + throughput/total_tokens=241,920,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1261/500000] + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=242,112,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1262/500000] + train/ActionNoiseL2Loss=0.1903 + throughput/total_tokens=242,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1263/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=242,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1264/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=242,688,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1265/500000] + train/ActionNoiseL2Loss=0.1350 + throughput/total_tokens=242,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1266/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=243,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1267/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=243,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1268/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=243,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1269/500000] + train/ActionNoiseL2Loss=0.1647 + throughput/total_tokens=243,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1270/500000] + train/ActionNoiseL2Loss=0.1635 + throughput/total_tokens=243,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1271/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=244,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1272/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=244,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1273/500000] + train/ActionNoiseL2Loss=0.1224 + throughput/total_tokens=244,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1274/500000] + train/ActionNoiseL2Loss=0.1518 + throughput/total_tokens=244,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1275/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=244,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1276/500000] + train/ActionNoiseL2Loss=0.1468 + throughput/total_tokens=244,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1277/500000] + train/ActionNoiseL2Loss=0.1012 + throughput/total_tokens=245,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1278/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=245,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1279/500000] + train/ActionNoiseL2Loss=0.1675 + throughput/total_tokens=245,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1280/500000] + optim/total_grad_norm=4.246 + train/ActionNoiseL2Loss=0.1250 + throughput/total_tokens=245,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1281/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=245,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1282/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=246,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1283/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=246,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1284/500000] + train/ActionNoiseL2Loss=0.1342 + throughput/total_tokens=246,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1285/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=246,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1286/500000] + train/ActionNoiseL2Loss=0.1771 + throughput/total_tokens=246,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1287/500000] + train/ActionNoiseL2Loss=0.1024 + throughput/total_tokens=247,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1288/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=247,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1289/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=247,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1290/500000] + train/ActionNoiseL2Loss=0.1756 + throughput/total_tokens=247,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1291/500000] + train/ActionNoiseL2Loss=0.2100 + throughput/total_tokens=247,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1292/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=248,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1293/500000] + train/ActionNoiseL2Loss=0.1809 + throughput/total_tokens=248,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1294/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=248,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1295/500000] + train/ActionNoiseL2Loss=0.1766 + throughput/total_tokens=248,640,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1296/500000] + train/ActionNoiseL2Loss=0.1824 + throughput/total_tokens=248,832,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1297/500000] + train/ActionNoiseL2Loss=0.1449 + throughput/total_tokens=249,024,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1298/500000] + train/ActionNoiseL2Loss=0.1832 + throughput/total_tokens=249,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1299/500000] + train/ActionNoiseL2Loss=0.1330 + throughput/total_tokens=249,408,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1300/500000] + optim/total_grad_norm=2.675 + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=249,600,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1301/500000] + train/ActionNoiseL2Loss=0.1370 + throughput/total_tokens=249,792,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1302/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=249,984,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1303/500000] + train/ActionNoiseL2Loss=0.1210 + throughput/total_tokens=250,176,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1304/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=250,368,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1305/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=250,560,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1306/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=250,752,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1307/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=250,944,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1308/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=251,136,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1309/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=251,328,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1310/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=251,520,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1311/500000] + train/ActionNoiseL2Loss=0.1209 + throughput/total_tokens=251,712,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1312/500000] + train/ActionNoiseL2Loss=0.1424 + throughput/total_tokens=251,904,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1313/500000] + train/ActionNoiseL2Loss=0.1296 + throughput/total_tokens=252,096,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1314/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=252,288,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1315/500000] + train/ActionNoiseL2Loss=0.1331 + throughput/total_tokens=252,480,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1316/500000] + train/ActionNoiseL2Loss=0.1282 + throughput/total_tokens=252,672,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1317/500000] + train/ActionNoiseL2Loss=0.1339 + throughput/total_tokens=252,864,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1318/500000] + train/ActionNoiseL2Loss=0.1498 + throughput/total_tokens=253,056,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1319/500000] + train/ActionNoiseL2Loss=0.1748 + throughput/total_tokens=253,248,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1320/500000] + optim/total_grad_norm=2.997 + train/ActionNoiseL2Loss=0.1711 + throughput/total_tokens=253,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1321/500000] + train/ActionNoiseL2Loss=0.1744 + throughput/total_tokens=253,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1322/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=253,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1323/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=254,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1324/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=254,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1325/500000] + train/ActionNoiseL2Loss=0.1230 + throughput/total_tokens=254,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1326/500000] + train/ActionNoiseL2Loss=0.1002 + throughput/total_tokens=254,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1327/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=254,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1328/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=254,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1329/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=255,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1330/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=255,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1331/500000] + train/ActionNoiseL2Loss=0.1390 + throughput/total_tokens=255,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1332/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=255,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1333/500000] + train/ActionNoiseL2Loss=0.1722 + throughput/total_tokens=255,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1334/500000] + train/ActionNoiseL2Loss=0.1298 + throughput/total_tokens=256,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1335/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=256,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1336/500000] + train/ActionNoiseL2Loss=0.1327 + throughput/total_tokens=256,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1337/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=256,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1338/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=256,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1339/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=257,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1340/500000] + optim/total_grad_norm=3.030 + train/ActionNoiseL2Loss=0.1406 + throughput/total_tokens=257,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1341/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=257,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1342/500000] + train/ActionNoiseL2Loss=0.0972 + throughput/total_tokens=257,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1343/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=257,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1344/500000] + train/ActionNoiseL2Loss=0.1395 + throughput/total_tokens=258,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1345/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=258,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1346/500000] + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=258,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1347/500000] + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=258,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1348/500000] + train/ActionNoiseL2Loss=0.2433 + throughput/total_tokens=258,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1349/500000] + train/ActionNoiseL2Loss=0.1400 + throughput/total_tokens=259,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1350/500000] + train/ActionNoiseL2Loss=0.1283 + throughput/total_tokens=259,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1351/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=259,392,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1352/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=259,584,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1353/500000] + train/ActionNoiseL2Loss=0.1307 + throughput/total_tokens=259,776,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1354/500000] + train/ActionNoiseL2Loss=0.2089 + throughput/total_tokens=259,968,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1355/500000] + train/ActionNoiseL2Loss=0.1505 + throughput/total_tokens=260,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1356/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=260,352,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1357/500000] + train/ActionNoiseL2Loss=0.1427 + throughput/total_tokens=260,544,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1358/500000] + train/ActionNoiseL2Loss=0.1890 + throughput/total_tokens=260,736,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1359/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=260,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1360/500000] + optim/total_grad_norm=4.320 + train/ActionNoiseL2Loss=0.1477 + throughput/total_tokens=261,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1361/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=261,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1362/500000] + train/ActionNoiseL2Loss=0.1706 + throughput/total_tokens=261,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1363/500000] + train/ActionNoiseL2Loss=0.1383 + throughput/total_tokens=261,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1364/500000] + train/ActionNoiseL2Loss=0.1637 + throughput/total_tokens=261,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1365/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=262,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1366/500000] + train/ActionNoiseL2Loss=0.1505 + throughput/total_tokens=262,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1367/500000] + train/ActionNoiseL2Loss=0.1762 + throughput/total_tokens=262,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1368/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=262,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1369/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=262,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1370/500000] + train/ActionNoiseL2Loss=0.2666 + throughput/total_tokens=263,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1371/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=263,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1372/500000] + train/ActionNoiseL2Loss=0.2174 + throughput/total_tokens=263,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1373/500000] + train/ActionNoiseL2Loss=0.1818 + throughput/total_tokens=263,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1374/500000] + train/ActionNoiseL2Loss=0.1591 + throughput/total_tokens=263,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1375/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=264,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1376/500000] + train/ActionNoiseL2Loss=0.1345 + throughput/total_tokens=264,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1377/500000] + train/ActionNoiseL2Loss=0.1429 + throughput/total_tokens=264,384,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1378/500000] + train/ActionNoiseL2Loss=0.1733 + throughput/total_tokens=264,576,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1379/500000] + train/ActionNoiseL2Loss=0.1882 + throughput/total_tokens=264,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1380/500000] + optim/total_grad_norm=2.852 + train/ActionNoiseL2Loss=0.1153 + throughput/total_tokens=264,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1381/500000] + train/ActionNoiseL2Loss=0.1844 + throughput/total_tokens=265,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1382/500000] + train/ActionNoiseL2Loss=0.2522 + throughput/total_tokens=265,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1383/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=265,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1384/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=265,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1385/500000] + train/ActionNoiseL2Loss=0.1255 + throughput/total_tokens=265,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1386/500000] + train/ActionNoiseL2Loss=0.1099 + throughput/total_tokens=266,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1387/500000] + train/ActionNoiseL2Loss=0.1690 + throughput/total_tokens=266,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1388/500000] + train/ActionNoiseL2Loss=0.1601 + throughput/total_tokens=266,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1389/500000] + train/ActionNoiseL2Loss=0.1522 + throughput/total_tokens=266,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1390/500000] + train/ActionNoiseL2Loss=0.1328 + throughput/total_tokens=266,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1391/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=267,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1392/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=267,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1393/500000] + train/ActionNoiseL2Loss=0.1399 + throughput/total_tokens=267,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1394/500000] + train/ActionNoiseL2Loss=0.1095 + throughput/total_tokens=267,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1395/500000] + train/ActionNoiseL2Loss=0.1467 + throughput/total_tokens=267,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1396/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=268,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1397/500000] + train/ActionNoiseL2Loss=0.1188 + throughput/total_tokens=268,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1398/500000] + train/ActionNoiseL2Loss=0.1250 + throughput/total_tokens=268,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1399/500000] + train/ActionNoiseL2Loss=0.1912 + throughput/total_tokens=268,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1400/500000] + optim/total_grad_norm=3.741 + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=268,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1401/500000] + train/ActionNoiseL2Loss=0.1403 + throughput/total_tokens=268,992,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0475 +[step=1402/500000] + train/ActionNoiseL2Loss=0.1649 + throughput/total_tokens=269,184,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1403/500000] + train/ActionNoiseL2Loss=0.1103 + throughput/total_tokens=269,376,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1404/500000] + train/ActionNoiseL2Loss=0.1828 + throughput/total_tokens=269,568,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1405/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=269,760,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1406/500000] + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=269,952,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1407/500000] + train/ActionNoiseL2Loss=0.1156 + throughput/total_tokens=270,144,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1408/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=270,336,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1409/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=270,528,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1410/500000] + train/ActionNoiseL2Loss=0.1798 + throughput/total_tokens=270,720,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 + System/Peak GPU Memory (MB)=51,076 +[step=1411/500000] + train/ActionNoiseL2Loss=0.1683 + throughput/total_tokens=270,912,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=1412/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=271,104,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1413/500000] + train/ActionNoiseL2Loss=0.2568 + throughput/total_tokens=271,296,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=1414/500000] + train/ActionNoiseL2Loss=0.1341 + throughput/total_tokens=271,488,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0475 +[step=1415/500000] + train/ActionNoiseL2Loss=0.1327 + throughput/total_tokens=271,680,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=1416/500000] + train/ActionNoiseL2Loss=0.1664 + throughput/total_tokens=271,872,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=1417/500000] + train/ActionNoiseL2Loss=0.1234 + throughput/total_tokens=272,064,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0475 +[step=1418/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=272,256,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=1419/500000] + train/ActionNoiseL2Loss=0.1986 + throughput/total_tokens=272,448,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=1420/500000] + optim/total_grad_norm=4.227 + train/ActionNoiseL2Loss=0.1423 + throughput/total_tokens=272,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1421/500000] + train/ActionNoiseL2Loss=0.1354 + throughput/total_tokens=272,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1422/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=273,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1423/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=273,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1424/500000] + train/ActionNoiseL2Loss=0.2221 + throughput/total_tokens=273,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1425/500000] + train/ActionNoiseL2Loss=0.1626 + throughput/total_tokens=273,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1426/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=273,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1427/500000] + train/ActionNoiseL2Loss=0.1208 + throughput/total_tokens=273,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1428/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=274,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1429/500000] + train/ActionNoiseL2Loss=0.1372 + throughput/total_tokens=274,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1430/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=274,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1431/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=274,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1432/500000] + train/ActionNoiseL2Loss=0.1600 + throughput/total_tokens=274,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1433/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=275,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1434/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=275,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1435/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=275,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1436/500000] + train/ActionNoiseL2Loss=0.1094 + throughput/total_tokens=275,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1437/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=275,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1438/500000] + train/ActionNoiseL2Loss=0.1341 + throughput/total_tokens=276,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1439/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=276,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1440/500000] + optim/total_grad_norm=2.176 + train/ActionNoiseL2Loss=0.1071 + throughput/total_tokens=276,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1441/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=276,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1442/500000] + train/ActionNoiseL2Loss=0.1474 + throughput/total_tokens=276,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1443/500000] + train/ActionNoiseL2Loss=0.1212 + throughput/total_tokens=277,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1444/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=277,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1445/500000] + train/ActionNoiseL2Loss=0.1266 + throughput/total_tokens=277,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1446/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=277,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1447/500000] + train/ActionNoiseL2Loss=0.1460 + throughput/total_tokens=277,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1448/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=278,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1449/500000] + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=278,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1450/500000] + train/ActionNoiseL2Loss=0.1166 + throughput/total_tokens=278,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1451/500000] + train/ActionNoiseL2Loss=0.1814 + throughput/total_tokens=278,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1452/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=278,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1453/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=278,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1454/500000] + train/ActionNoiseL2Loss=0.2078 + throughput/total_tokens=279,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1455/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=279,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1456/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=279,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1457/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=279,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1458/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=279,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1459/500000] + train/ActionNoiseL2Loss=0.1373 + throughput/total_tokens=280,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1460/500000] + optim/total_grad_norm=3.816 + train/ActionNoiseL2Loss=0.1549 + throughput/total_tokens=280,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1461/500000] + train/ActionNoiseL2Loss=0.1832 + throughput/total_tokens=280,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1462/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=280,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1463/500000] + train/ActionNoiseL2Loss=0.0948 + throughput/total_tokens=280,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1464/500000] + train/ActionNoiseL2Loss=0.1186 + throughput/total_tokens=281,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1465/500000] + train/ActionNoiseL2Loss=0.1363 + throughput/total_tokens=281,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1466/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=281,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1467/500000] + train/ActionNoiseL2Loss=0.1057 + throughput/total_tokens=281,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1468/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=281,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1469/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=282,048,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1470/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=282,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1471/500000] + train/ActionNoiseL2Loss=0.1066 + throughput/total_tokens=282,432,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1472/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=282,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1473/500000] + train/ActionNoiseL2Loss=0.1566 + throughput/total_tokens=282,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1474/500000] + train/ActionNoiseL2Loss=0.1503 + throughput/total_tokens=283,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1475/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=283,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1476/500000] + train/ActionNoiseL2Loss=0.1554 + throughput/total_tokens=283,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1477/500000] + train/ActionNoiseL2Loss=0.1601 + throughput/total_tokens=283,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1478/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=283,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1479/500000] + train/ActionNoiseL2Loss=0.1173 + throughput/total_tokens=283,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1480/500000] + optim/total_grad_norm=1.834 + train/ActionNoiseL2Loss=0.1275 + throughput/total_tokens=284,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1481/500000] + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=284,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1482/500000] + train/ActionNoiseL2Loss=0.1348 + throughput/total_tokens=284,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1483/500000] + train/ActionNoiseL2Loss=0.1770 + throughput/total_tokens=284,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1484/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=284,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1485/500000] + train/ActionNoiseL2Loss=0.1341 + throughput/total_tokens=285,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1486/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=285,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1487/500000] + train/ActionNoiseL2Loss=0.1502 + throughput/total_tokens=285,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1488/500000] + train/ActionNoiseL2Loss=0.1411 + throughput/total_tokens=285,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1489/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=285,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1490/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=286,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1491/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=286,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1492/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=286,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1493/500000] + train/ActionNoiseL2Loss=0.1321 + throughput/total_tokens=286,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1494/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=286,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1495/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=287,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1496/500000] + train/ActionNoiseL2Loss=0.1415 + throughput/total_tokens=287,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1497/500000] + train/ActionNoiseL2Loss=0.1196 + throughput/total_tokens=287,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1498/500000] + train/ActionNoiseL2Loss=0.1899 + throughput/total_tokens=287,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1499/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=287,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1500/500000] + optim/total_grad_norm=3.736 + train/ActionNoiseL2Loss=0.1648 + throughput/total_tokens=288,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/12 [01:34:16] INFO | >> Saving config... checkpoint.py:608 +10/12 [01:34:49] INFO | >> Saving model state... checkpoint.py:796 +10/12 [01:35:57] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [01:37:28] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=1501/500000] + train/ActionNoiseL2Loss=0.1542 + throughput/total_tokens=288,192,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=1502/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=288,384,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=1503/500000] + train/ActionNoiseL2Loss=0.2380 + throughput/total_tokens=288,576,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1504/500000] + train/ActionNoiseL2Loss=0.2194 + throughput/total_tokens=288,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1505/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=288,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1506/500000] + train/ActionNoiseL2Loss=0.1887 + throughput/total_tokens=289,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1507/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=289,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1508/500000] + train/ActionNoiseL2Loss=0.1224 + throughput/total_tokens=289,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1509/500000] + train/ActionNoiseL2Loss=0.1662 + throughput/total_tokens=289,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1510/500000] + train/ActionNoiseL2Loss=0.1778 + throughput/total_tokens=289,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1511/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=290,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1512/500000] + train/ActionNoiseL2Loss=0.1364 + throughput/total_tokens=290,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1513/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=290,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1514/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=290,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1515/500000] + train/ActionNoiseL2Loss=0.1382 + throughput/total_tokens=290,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1516/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=291,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1517/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=291,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1518/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=291,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1519/500000] + train/ActionNoiseL2Loss=0.1306 + throughput/total_tokens=291,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1520/500000] + optim/total_grad_norm=2.514 + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=291,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1521/500000] + train/ActionNoiseL2Loss=0.1586 + throughput/total_tokens=292,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1522/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=292,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1523/500000] + train/ActionNoiseL2Loss=0.1201 + throughput/total_tokens=292,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1524/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=292,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1525/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=292,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1526/500000] + train/ActionNoiseL2Loss=0.1569 + throughput/total_tokens=292,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1527/500000] + train/ActionNoiseL2Loss=0.1274 + throughput/total_tokens=293,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1528/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=293,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1529/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=293,568,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1530/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=293,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1531/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=293,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1532/500000] + train/ActionNoiseL2Loss=0.1833 + throughput/total_tokens=294,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1533/500000] + train/ActionNoiseL2Loss=0.1383 + throughput/total_tokens=294,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1534/500000] + train/ActionNoiseL2Loss=0.1411 + throughput/total_tokens=294,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1535/500000] + train/ActionNoiseL2Loss=0.1393 + throughput/total_tokens=294,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1536/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=294,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1537/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=295,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1538/500000] + train/ActionNoiseL2Loss=0.1486 + throughput/total_tokens=295,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1539/500000] + train/ActionNoiseL2Loss=0.1150 + throughput/total_tokens=295,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1540/500000] + optim/total_grad_norm=2.033 + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=295,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1541/500000] + train/ActionNoiseL2Loss=0.1114 + throughput/total_tokens=295,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1542/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=296,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1543/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=296,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1544/500000] + train/ActionNoiseL2Loss=0.1255 + throughput/total_tokens=296,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1545/500000] + train/ActionNoiseL2Loss=0.1131 + throughput/total_tokens=296,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1546/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=296,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1547/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=297,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1548/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=297,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1549/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=297,408,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1550/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=297,600,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1551/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=297,792,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1552/500000] + train/ActionNoiseL2Loss=0.1304 + throughput/total_tokens=297,984,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1553/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=298,176,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1554/500000] + train/ActionNoiseL2Loss=0.1126 + throughput/total_tokens=298,368,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1555/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=298,560,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1556/500000] + train/ActionNoiseL2Loss=0.1328 + throughput/total_tokens=298,752,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1557/500000] + train/ActionNoiseL2Loss=0.1084 + throughput/total_tokens=298,944,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1558/500000] + train/ActionNoiseL2Loss=0.1064 + throughput/total_tokens=299,136,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1559/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=299,328,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1560/500000] + optim/total_grad_norm=2.437 + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=299,520,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1561/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=299,712,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1562/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=299,904,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=1563/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=300,096,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=1564/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=300,288,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=1565/500000] + train/ActionNoiseL2Loss=0.1495 + throughput/total_tokens=300,480,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1566/500000] + train/ActionNoiseL2Loss=0.1394 + throughput/total_tokens=300,672,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1567/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=300,864,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=1568/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=301,056,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1569/500000] + train/ActionNoiseL2Loss=0.2135 + throughput/total_tokens=301,248,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1570/500000] + train/ActionNoiseL2Loss=0.1803 + throughput/total_tokens=301,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1571/500000] + train/ActionNoiseL2Loss=0.1265 + throughput/total_tokens=301,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1572/500000] + train/ActionNoiseL2Loss=0.1278 + throughput/total_tokens=301,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1573/500000] + train/ActionNoiseL2Loss=0.1284 + throughput/total_tokens=302,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1574/500000] + train/ActionNoiseL2Loss=0.1322 + throughput/total_tokens=302,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1575/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=302,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1576/500000] + train/ActionNoiseL2Loss=0.1698 + throughput/total_tokens=302,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1577/500000] + train/ActionNoiseL2Loss=0.1882 + throughput/total_tokens=302,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1578/500000] + train/ActionNoiseL2Loss=0.1235 + throughput/total_tokens=302,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1579/500000] + train/ActionNoiseL2Loss=0.2130 + throughput/total_tokens=303,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1580/500000] + optim/total_grad_norm=3.304 + train/ActionNoiseL2Loss=0.2065 + throughput/total_tokens=303,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1581/500000] + train/ActionNoiseL2Loss=0.1197 + throughput/total_tokens=303,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1582/500000] + train/ActionNoiseL2Loss=0.1116 + throughput/total_tokens=303,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1583/500000] + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=303,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1584/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=304,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1585/500000] + train/ActionNoiseL2Loss=0.1454 + throughput/total_tokens=304,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1586/500000] + train/ActionNoiseL2Loss=0.1320 + throughput/total_tokens=304,512,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1587/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=304,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1588/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=304,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1589/500000] + train/ActionNoiseL2Loss=0.1497 + throughput/total_tokens=305,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1590/500000] + train/ActionNoiseL2Loss=0.1152 + throughput/total_tokens=305,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1591/500000] + train/ActionNoiseL2Loss=0.1493 + throughput/total_tokens=305,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1592/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=305,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1593/500000] + train/ActionNoiseL2Loss=0.1443 + throughput/total_tokens=305,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1594/500000] + train/ActionNoiseL2Loss=0.1171 + throughput/total_tokens=306,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1595/500000] + train/ActionNoiseL2Loss=0.1859 + throughput/total_tokens=306,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1596/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=306,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1597/500000] + train/ActionNoiseL2Loss=0.1393 + throughput/total_tokens=306,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1598/500000] + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=306,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1599/500000] + train/ActionNoiseL2Loss=0.1843 + throughput/total_tokens=307,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1600/500000] + optim/total_grad_norm=6.496 + train/ActionNoiseL2Loss=0.1698 + throughput/total_tokens=307,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1601/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=307,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1602/500000] + train/ActionNoiseL2Loss=0.1470 + throughput/total_tokens=307,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1603/500000] + train/ActionNoiseL2Loss=0.1352 + throughput/total_tokens=307,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1604/500000] + train/ActionNoiseL2Loss=0.1438 + throughput/total_tokens=307,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1605/500000] + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=308,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1606/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=308,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1607/500000] + train/ActionNoiseL2Loss=0.1083 + throughput/total_tokens=308,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1608/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=308,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1609/500000] + train/ActionNoiseL2Loss=0.1189 + throughput/total_tokens=308,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1610/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=309,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1611/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=309,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1612/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=309,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1613/500000] + train/ActionNoiseL2Loss=0.1230 + throughput/total_tokens=309,696,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1614/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=309,888,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1615/500000] + train/ActionNoiseL2Loss=0.1311 + throughput/total_tokens=310,080,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1616/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=310,272,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1617/500000] + train/ActionNoiseL2Loss=0.1188 + throughput/total_tokens=310,464,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1618/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=310,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1619/500000] + train/ActionNoiseL2Loss=0.1285 + throughput/total_tokens=310,848,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1620/500000] + optim/total_grad_norm=1.625 + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=311,040,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=1621/500000] + train/ActionNoiseL2Loss=0.1700 + throughput/total_tokens=311,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1622/500000] + train/ActionNoiseL2Loss=0.1209 + throughput/total_tokens=311,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1623/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=311,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1624/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=311,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1625/500000] + train/ActionNoiseL2Loss=0.1394 + throughput/total_tokens=312,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1626/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=312,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1627/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=312,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1628/500000] + train/ActionNoiseL2Loss=0.2021 + throughput/total_tokens=312,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1629/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=312,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1630/500000] + train/ActionNoiseL2Loss=0.1087 + throughput/total_tokens=312,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1631/500000] + train/ActionNoiseL2Loss=0.1250 + throughput/total_tokens=313,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1632/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=313,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1633/500000] + train/ActionNoiseL2Loss=0.1539 + throughput/total_tokens=313,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1634/500000] + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=313,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1635/500000] + train/ActionNoiseL2Loss=0.1483 + throughput/total_tokens=313,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1636/500000] + train/ActionNoiseL2Loss=0.1456 + throughput/total_tokens=314,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1637/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=314,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1638/500000] + train/ActionNoiseL2Loss=0.2020 + throughput/total_tokens=314,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1639/500000] + train/ActionNoiseL2Loss=0.1122 + throughput/total_tokens=314,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1640/500000] + optim/total_grad_norm=2.966 + train/ActionNoiseL2Loss=0.1528 + throughput/total_tokens=314,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1641/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=315,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1642/500000] + train/ActionNoiseL2Loss=0.2163 + throughput/total_tokens=315,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1643/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=315,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1644/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=315,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1645/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=315,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1646/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=316,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1647/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=316,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1648/500000] + train/ActionNoiseL2Loss=0.1487 + throughput/total_tokens=316,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1649/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=316,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1650/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=316,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1651/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=316,992,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1652/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=317,184,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1653/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=317,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1654/500000] + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=317,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1655/500000] + train/ActionNoiseL2Loss=0.1439 + throughput/total_tokens=317,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1656/500000] + train/ActionNoiseL2Loss=0.1683 + throughput/total_tokens=317,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1657/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=318,144,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1658/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=318,336,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1659/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=318,528,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1660/500000] + optim/total_grad_norm=2.383 + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=318,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1661/500000] + train/ActionNoiseL2Loss=0.1826 + throughput/total_tokens=318,912,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1662/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=319,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1663/500000] + train/ActionNoiseL2Loss=0.1608 + throughput/total_tokens=319,296,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1664/500000] + train/ActionNoiseL2Loss=0.1747 + throughput/total_tokens=319,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1665/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=319,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1666/500000] + train/ActionNoiseL2Loss=0.1187 + throughput/total_tokens=319,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1667/500000] + train/ActionNoiseL2Loss=0.1150 + throughput/total_tokens=320,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1668/500000] + train/ActionNoiseL2Loss=0.1546 + throughput/total_tokens=320,256,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=1669/500000] + train/ActionNoiseL2Loss=0.1143 + throughput/total_tokens=320,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1670/500000] + train/ActionNoiseL2Loss=0.1101 + throughput/total_tokens=320,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1671/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=320,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1672/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=321,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1673/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=321,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1674/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=321,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1675/500000] + train/ActionNoiseL2Loss=0.1412 + throughput/total_tokens=321,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1676/500000] + train/ActionNoiseL2Loss=0.1601 + throughput/total_tokens=321,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1677/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=321,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1678/500000] + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=322,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1679/500000] + train/ActionNoiseL2Loss=0.1375 + throughput/total_tokens=322,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1680/500000] + optim/total_grad_norm=2.864 + train/ActionNoiseL2Loss=0.1305 + throughput/total_tokens=322,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1681/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=322,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1682/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=322,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1683/500000] + train/ActionNoiseL2Loss=0.1105 + throughput/total_tokens=323,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1684/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=323,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1685/500000] + train/ActionNoiseL2Loss=0.1728 + throughput/total_tokens=323,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1686/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=323,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1687/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=323,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1688/500000] + train/ActionNoiseL2Loss=0.1634 + throughput/total_tokens=324,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1689/500000] + train/ActionNoiseL2Loss=0.1547 + throughput/total_tokens=324,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1690/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=324,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=1691/500000] + train/ActionNoiseL2Loss=0.1480 + throughput/total_tokens=324,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1692/500000] + train/ActionNoiseL2Loss=0.1297 + throughput/total_tokens=324,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1693/500000] + train/ActionNoiseL2Loss=0.1521 + throughput/total_tokens=325,056,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1694/500000] + train/ActionNoiseL2Loss=0.1286 + throughput/total_tokens=325,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1695/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=325,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1696/500000] + train/ActionNoiseL2Loss=0.1295 + throughput/total_tokens=325,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1697/500000] + train/ActionNoiseL2Loss=0.1706 + throughput/total_tokens=325,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1698/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=326,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1699/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=326,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1700/500000] + optim/total_grad_norm=4.317 + train/ActionNoiseL2Loss=0.1406 + throughput/total_tokens=326,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=1701/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=326,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1702/500000] + train/ActionNoiseL2Loss=0.1356 + throughput/total_tokens=326,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1703/500000] + train/ActionNoiseL2Loss=0.1434 + throughput/total_tokens=326,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1704/500000] + train/ActionNoiseL2Loss=0.1686 + throughput/total_tokens=327,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1705/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=327,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1706/500000] + train/ActionNoiseL2Loss=0.0996 + throughput/total_tokens=327,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1707/500000] + train/ActionNoiseL2Loss=0.1364 + throughput/total_tokens=327,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1708/500000] + train/ActionNoiseL2Loss=0.1118 + throughput/total_tokens=327,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1709/500000] + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=328,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1710/500000] + train/ActionNoiseL2Loss=0.1415 + throughput/total_tokens=328,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1711/500000] + train/ActionNoiseL2Loss=0.1486 + throughput/total_tokens=328,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1712/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=328,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1713/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=328,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1714/500000] + train/ActionNoiseL2Loss=0.2131 + throughput/total_tokens=329,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1715/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=329,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1716/500000] + train/ActionNoiseL2Loss=0.1326 + throughput/total_tokens=329,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1717/500000] + train/ActionNoiseL2Loss=0.1307 + throughput/total_tokens=329,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1718/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=329,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1719/500000] + train/ActionNoiseL2Loss=0.1303 + throughput/total_tokens=330,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1720/500000] + optim/total_grad_norm=3.019 + train/ActionNoiseL2Loss=0.1749 + throughput/total_tokens=330,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1721/500000] + train/ActionNoiseL2Loss=0.1370 + throughput/total_tokens=330,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1722/500000] + train/ActionNoiseL2Loss=0.1171 + throughput/total_tokens=330,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1723/500000] + train/ActionNoiseL2Loss=0.1433 + throughput/total_tokens=330,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1724/500000] + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=331,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1725/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=331,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1726/500000] + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=331,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1727/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=331,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1728/500000] + train/ActionNoiseL2Loss=0.1123 + throughput/total_tokens=331,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1729/500000] + train/ActionNoiseL2Loss=0.1333 + throughput/total_tokens=331,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1730/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=332,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1731/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=332,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1732/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=332,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1733/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=332,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1734/500000] + train/ActionNoiseL2Loss=0.1007 + throughput/total_tokens=332,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1735/500000] + train/ActionNoiseL2Loss=0.1433 + throughput/total_tokens=333,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1736/500000] + train/ActionNoiseL2Loss=0.1167 + throughput/total_tokens=333,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1737/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=333,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1738/500000] + train/ActionNoiseL2Loss=0.1579 + throughput/total_tokens=333,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1739/500000] + train/ActionNoiseL2Loss=0.1340 + throughput/total_tokens=333,888,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1740/500000] + optim/total_grad_norm=2.011 + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=334,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1741/500000] + train/ActionNoiseL2Loss=0.1747 + throughput/total_tokens=334,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1742/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=334,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1743/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=334,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1744/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=334,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1745/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=335,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1746/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=335,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1747/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=335,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1748/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=335,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1749/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=335,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1750/500000] + train/ActionNoiseL2Loss=0.2277 + throughput/total_tokens=336,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1751/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=336,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1752/500000] + train/ActionNoiseL2Loss=0.1294 + throughput/total_tokens=336,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1753/500000] + train/ActionNoiseL2Loss=0.1234 + throughput/total_tokens=336,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1754/500000] + train/ActionNoiseL2Loss=0.1804 + throughput/total_tokens=336,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1755/500000] + train/ActionNoiseL2Loss=0.1156 + throughput/total_tokens=336,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1756/500000] + train/ActionNoiseL2Loss=0.1701 + throughput/total_tokens=337,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1757/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=337,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1758/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=337,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1759/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=337,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1760/500000] + optim/total_grad_norm=1.946 + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=337,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1761/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=338,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1762/500000] + train/ActionNoiseL2Loss=0.1435 + throughput/total_tokens=338,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1763/500000] + train/ActionNoiseL2Loss=0.1759 + throughput/total_tokens=338,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1764/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=338,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1765/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=338,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1766/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=339,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1767/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=339,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1768/500000] + train/ActionNoiseL2Loss=0.1391 + throughput/total_tokens=339,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1769/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=339,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1770/500000] + train/ActionNoiseL2Loss=0.1193 + throughput/total_tokens=339,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1771/500000] + train/ActionNoiseL2Loss=0.1334 + throughput/total_tokens=340,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1772/500000] + train/ActionNoiseL2Loss=0.1112 + throughput/total_tokens=340,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1773/500000] + train/ActionNoiseL2Loss=0.1942 + throughput/total_tokens=340,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1774/500000] + train/ActionNoiseL2Loss=0.1534 + throughput/total_tokens=340,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1775/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=340,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1776/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=340,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1777/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=341,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1778/500000] + train/ActionNoiseL2Loss=0.1415 + throughput/total_tokens=341,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1779/500000] + train/ActionNoiseL2Loss=0.1974 + throughput/total_tokens=341,568,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1780/500000] + optim/total_grad_norm=3.279 + train/ActionNoiseL2Loss=0.1613 + throughput/total_tokens=341,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1781/500000] + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=341,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1782/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=342,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1783/500000] + train/ActionNoiseL2Loss=0.1823 + throughput/total_tokens=342,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1784/500000] + train/ActionNoiseL2Loss=0.1268 + throughput/total_tokens=342,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1785/500000] + train/ActionNoiseL2Loss=0.1755 + throughput/total_tokens=342,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1786/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=342,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1787/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=343,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1788/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=343,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1789/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=343,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1790/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=343,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1791/500000] + train/ActionNoiseL2Loss=0.1414 + throughput/total_tokens=343,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1792/500000] + train/ActionNoiseL2Loss=0.1256 + throughput/total_tokens=344,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1793/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=344,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1794/500000] + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=344,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1795/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=344,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1796/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=344,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1797/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=345,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1798/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=345,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1799/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=345,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1800/500000] + optim/total_grad_norm=1.655 + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=345,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1801/500000] + train/ActionNoiseL2Loss=0.1437 + throughput/total_tokens=345,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1802/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=345,984,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1803/500000] + train/ActionNoiseL2Loss=0.1239 + throughput/total_tokens=346,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1804/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=346,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1805/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=346,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1806/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=346,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1807/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=346,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1808/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=347,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1809/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=347,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1810/500000] + train/ActionNoiseL2Loss=0.1152 + throughput/total_tokens=347,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1811/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=347,712,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1812/500000] + train/ActionNoiseL2Loss=0.1294 + throughput/total_tokens=347,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1813/500000] + train/ActionNoiseL2Loss=0.1095 + throughput/total_tokens=348,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1814/500000] + train/ActionNoiseL2Loss=0.1492 + throughput/total_tokens=348,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1815/500000] + train/ActionNoiseL2Loss=0.1165 + throughput/total_tokens=348,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1816/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=348,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1817/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=348,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1818/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=349,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1819/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=349,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1820/500000] + optim/total_grad_norm=4.232 + train/ActionNoiseL2Loss=0.1614 + throughput/total_tokens=349,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1821/500000] + train/ActionNoiseL2Loss=0.1702 + throughput/total_tokens=349,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1822/500000] + train/ActionNoiseL2Loss=0.1176 + throughput/total_tokens=349,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1823/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=350,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1824/500000] + train/ActionNoiseL2Loss=0.1307 + throughput/total_tokens=350,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1825/500000] + train/ActionNoiseL2Loss=0.1369 + throughput/total_tokens=350,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1826/500000] + train/ActionNoiseL2Loss=0.2047 + throughput/total_tokens=350,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1827/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=350,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1828/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=350,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1829/500000] + train/ActionNoiseL2Loss=0.1404 + throughput/total_tokens=351,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1830/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=351,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1831/500000] + train/ActionNoiseL2Loss=0.1068 + throughput/total_tokens=351,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1832/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=351,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1833/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=351,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1834/500000] + train/ActionNoiseL2Loss=0.1685 + throughput/total_tokens=352,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1835/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=352,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1836/500000] + train/ActionNoiseL2Loss=0.1298 + throughput/total_tokens=352,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1837/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=352,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1838/500000] + train/ActionNoiseL2Loss=0.1290 + throughput/total_tokens=352,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1839/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=353,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1840/500000] + optim/total_grad_norm=2.260 + train/ActionNoiseL2Loss=0.1604 + throughput/total_tokens=353,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1841/500000] + train/ActionNoiseL2Loss=0.1204 + throughput/total_tokens=353,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1842/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=353,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1843/500000] + train/ActionNoiseL2Loss=0.1273 + throughput/total_tokens=353,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1844/500000] + train/ActionNoiseL2Loss=0.2084 + throughput/total_tokens=354,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1845/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=354,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1846/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=354,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1847/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=354,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1848/500000] + train/ActionNoiseL2Loss=0.1085 + throughput/total_tokens=354,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1849/500000] + train/ActionNoiseL2Loss=0.1359 + throughput/total_tokens=355,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1850/500000] + train/ActionNoiseL2Loss=0.1635 + throughput/total_tokens=355,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1851/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=355,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1852/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=355,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1853/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=355,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1854/500000] + train/ActionNoiseL2Loss=0.1106 + throughput/total_tokens=355,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1855/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=356,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1856/500000] + train/ActionNoiseL2Loss=0.1424 + throughput/total_tokens=356,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1857/500000] + train/ActionNoiseL2Loss=0.1768 + throughput/total_tokens=356,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1858/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=356,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1859/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=356,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1860/500000] + optim/total_grad_norm=3.523 + train/ActionNoiseL2Loss=0.1598 + throughput/total_tokens=357,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1861/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=357,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1862/500000] + train/ActionNoiseL2Loss=0.1640 + throughput/total_tokens=357,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1863/500000] + train/ActionNoiseL2Loss=0.1013 + throughput/total_tokens=357,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1864/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=357,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1865/500000] + train/ActionNoiseL2Loss=0.1421 + throughput/total_tokens=358,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1866/500000] + train/ActionNoiseL2Loss=0.1616 + throughput/total_tokens=358,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1867/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=358,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1868/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=358,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1869/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=358,848,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1870/500000] + train/ActionNoiseL2Loss=0.1106 + throughput/total_tokens=359,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1871/500000] + train/ActionNoiseL2Loss=0.1572 + throughput/total_tokens=359,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1872/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=359,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1873/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=359,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1874/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=359,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1875/500000] + train/ActionNoiseL2Loss=0.1224 + throughput/total_tokens=360,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1876/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=360,192,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1877/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=360,384,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1878/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=360,576,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=1879/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=360,768,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1880/500000] + optim/total_grad_norm=1.260 + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=360,960,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=1881/500000] + train/ActionNoiseL2Loss=0.1204 + throughput/total_tokens=361,152,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1882/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=361,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1883/500000] + train/ActionNoiseL2Loss=0.1158 + throughput/total_tokens=361,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1884/500000] + train/ActionNoiseL2Loss=0.1158 + throughput/total_tokens=361,728,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1885/500000] + train/ActionNoiseL2Loss=0.1203 + throughput/total_tokens=361,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1886/500000] + train/ActionNoiseL2Loss=0.1350 + throughput/total_tokens=362,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1887/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=362,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1888/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=362,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1889/500000] + train/ActionNoiseL2Loss=0.1129 + throughput/total_tokens=362,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1890/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=362,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1891/500000] + train/ActionNoiseL2Loss=0.1741 + throughput/total_tokens=363,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1892/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=363,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1893/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=363,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1894/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=363,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1895/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=363,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1896/500000] + train/ActionNoiseL2Loss=0.1772 + throughput/total_tokens=364,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1897/500000] + train/ActionNoiseL2Loss=0.1248 + throughput/total_tokens=364,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1898/500000] + train/ActionNoiseL2Loss=0.1324 + throughput/total_tokens=364,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=1899/500000] + train/ActionNoiseL2Loss=0.1590 + throughput/total_tokens=364,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=1900/500000] + optim/total_grad_norm=1.793 + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=364,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=1901/500000] + train/ActionNoiseL2Loss=0.2276 + throughput/total_tokens=364,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1902/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=365,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1903/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=365,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1904/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=365,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1905/500000] + train/ActionNoiseL2Loss=0.1623 + throughput/total_tokens=365,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1906/500000] + train/ActionNoiseL2Loss=0.1409 + throughput/total_tokens=365,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1907/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=366,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1908/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=366,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1909/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=366,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=1910/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=366,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=1911/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=366,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1912/500000] + train/ActionNoiseL2Loss=0.1556 + throughput/total_tokens=367,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1913/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=367,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1914/500000] + train/ActionNoiseL2Loss=0.1116 + throughput/total_tokens=367,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1915/500000] + train/ActionNoiseL2Loss=0.1350 + throughput/total_tokens=367,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1916/500000] + train/ActionNoiseL2Loss=0.1211 + throughput/total_tokens=367,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=1917/500000] + train/ActionNoiseL2Loss=0.1182 + throughput/total_tokens=368,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1918/500000] + train/ActionNoiseL2Loss=0.1386 + throughput/total_tokens=368,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1919/500000] + train/ActionNoiseL2Loss=0.0929 + throughput/total_tokens=368,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1920/500000] + optim/total_grad_norm=2.620 + train/ActionNoiseL2Loss=0.1472 + throughput/total_tokens=368,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1921/500000] + train/ActionNoiseL2Loss=0.1257 + throughput/total_tokens=368,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1922/500000] + train/ActionNoiseL2Loss=0.1412 + throughput/total_tokens=369,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1923/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=369,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1924/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=369,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1925/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=369,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1926/500000] + train/ActionNoiseL2Loss=0.1612 + throughput/total_tokens=369,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1927/500000] + train/ActionNoiseL2Loss=0.1476 + throughput/total_tokens=369,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1928/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=370,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1929/500000] + train/ActionNoiseL2Loss=0.1336 + throughput/total_tokens=370,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1930/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=370,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1931/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=370,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1932/500000] + train/ActionNoiseL2Loss=0.1476 + throughput/total_tokens=370,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1933/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=371,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1934/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=371,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1935/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=371,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1936/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=371,712,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1937/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=371,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1938/500000] + train/ActionNoiseL2Loss=0.1468 + throughput/total_tokens=372,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1939/500000] + train/ActionNoiseL2Loss=0.1285 + throughput/total_tokens=372,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1940/500000] + optim/total_grad_norm=2.228 + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=372,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1941/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=372,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1942/500000] + train/ActionNoiseL2Loss=0.1013 + throughput/total_tokens=372,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1943/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=373,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1944/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=373,248,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1945/500000] + train/ActionNoiseL2Loss=0.1282 + throughput/total_tokens=373,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1946/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=373,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1947/500000] + train/ActionNoiseL2Loss=0.1671 + throughput/total_tokens=373,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1948/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=374,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1949/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=374,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=1950/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=374,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1951/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=374,592,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1952/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=374,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1953/500000] + train/ActionNoiseL2Loss=0.1296 + throughput/total_tokens=374,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1954/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=375,168,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1955/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=375,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1956/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=375,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1957/500000] + train/ActionNoiseL2Loss=0.1166 + throughput/total_tokens=375,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1958/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=375,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1959/500000] + train/ActionNoiseL2Loss=0.1186 + throughput/total_tokens=376,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1960/500000] + optim/total_grad_norm=2.251 + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=376,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=1961/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=376,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1962/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=376,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1963/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=376,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1964/500000] + train/ActionNoiseL2Loss=0.1242 + throughput/total_tokens=377,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1965/500000] + train/ActionNoiseL2Loss=0.1177 + throughput/total_tokens=377,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1966/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=377,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1967/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=377,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=1968/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=377,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1969/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=378,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=1970/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=378,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1971/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=378,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1972/500000] + train/ActionNoiseL2Loss=0.1962 + throughput/total_tokens=378,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1973/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=378,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1974/500000] + train/ActionNoiseL2Loss=0.1905 + throughput/total_tokens=379,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1975/500000] + train/ActionNoiseL2Loss=0.1374 + throughput/total_tokens=379,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1976/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=379,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1977/500000] + train/ActionNoiseL2Loss=0.1203 + throughput/total_tokens=379,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1978/500000] + train/ActionNoiseL2Loss=0.1234 + throughput/total_tokens=379,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1979/500000] + train/ActionNoiseL2Loss=0.1472 + throughput/total_tokens=379,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1980/500000] + optim/total_grad_norm=1.700 + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=380,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1981/500000] + train/ActionNoiseL2Loss=0.1743 + throughput/total_tokens=380,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1982/500000] + train/ActionNoiseL2Loss=0.1406 + throughput/total_tokens=380,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1983/500000] + train/ActionNoiseL2Loss=0.0982 + throughput/total_tokens=380,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1984/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=380,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1985/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=381,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1986/500000] + train/ActionNoiseL2Loss=0.1643 + throughput/total_tokens=381,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1987/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=381,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=1988/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=381,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1989/500000] + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=381,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1990/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=382,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=1991/500000] + train/ActionNoiseL2Loss=0.1295 + throughput/total_tokens=382,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1992/500000] + train/ActionNoiseL2Loss=0.1291 + throughput/total_tokens=382,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1993/500000] + train/ActionNoiseL2Loss=0.1419 + throughput/total_tokens=382,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1994/500000] + train/ActionNoiseL2Loss=0.1269 + throughput/total_tokens=382,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1995/500000] + train/ActionNoiseL2Loss=0.1390 + throughput/total_tokens=383,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1996/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=383,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1997/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=383,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1998/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=383,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=1999/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=383,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2000/500000] + optim/total_grad_norm=1.248 + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=384,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/12 [04:33:09] INFO | >> Saving config... checkpoint.py:608 +10/12 [04:33:41] INFO | >> Saving model state... checkpoint.py:796 +10/12 [04:34:50] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [04:36:21] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=2001/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=384,192,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=2002/500000] + train/ActionNoiseL2Loss=0.1802 + throughput/total_tokens=384,384,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=2003/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=384,576,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2004/500000] + train/ActionNoiseL2Loss=0.1111 + throughput/total_tokens=384,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2005/500000] + train/ActionNoiseL2Loss=0.1729 + throughput/total_tokens=384,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2006/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=385,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2007/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=385,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2008/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=385,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2009/500000] + train/ActionNoiseL2Loss=0.1197 + throughput/total_tokens=385,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2010/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=385,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2011/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=386,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2012/500000] + train/ActionNoiseL2Loss=0.1766 + throughput/total_tokens=386,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2013/500000] + train/ActionNoiseL2Loss=0.0972 + throughput/total_tokens=386,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2014/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=386,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2015/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=386,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2016/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=387,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2017/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=387,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2018/500000] + train/ActionNoiseL2Loss=0.1102 + throughput/total_tokens=387,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2019/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=387,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2020/500000] + optim/total_grad_norm=2.504 + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=387,840,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2021/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=388,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2022/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=388,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2023/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=388,416,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2024/500000] + train/ActionNoiseL2Loss=0.1443 + throughput/total_tokens=388,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2025/500000] + train/ActionNoiseL2Loss=0.1506 + throughput/total_tokens=388,800,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2026/500000] + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=388,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2027/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=389,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2028/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=389,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2029/500000] + train/ActionNoiseL2Loss=0.1270 + throughput/total_tokens=389,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2030/500000] + train/ActionNoiseL2Loss=0.1278 + throughput/total_tokens=389,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2031/500000] + train/ActionNoiseL2Loss=0.1251 + throughput/total_tokens=389,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2032/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=390,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2033/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=390,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2034/500000] + train/ActionNoiseL2Loss=0.1340 + throughput/total_tokens=390,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2035/500000] + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=390,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2036/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=390,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2037/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=391,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2038/500000] + train/ActionNoiseL2Loss=0.1133 + throughput/total_tokens=391,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2039/500000] + train/ActionNoiseL2Loss=0.1844 + throughput/total_tokens=391,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2040/500000] + optim/total_grad_norm=3.497 + train/ActionNoiseL2Loss=0.1780 + throughput/total_tokens=391,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2041/500000] + train/ActionNoiseL2Loss=0.1647 + throughput/total_tokens=391,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2042/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=392,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2043/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=392,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2044/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=392,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2045/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=392,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2046/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=392,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2047/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=393,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2048/500000] + train/ActionNoiseL2Loss=0.1321 + throughput/total_tokens=393,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2049/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=393,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2050/500000] + train/ActionNoiseL2Loss=0.1282 + throughput/total_tokens=393,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2051/500000] + train/ActionNoiseL2Loss=0.1221 + throughput/total_tokens=393,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2052/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=393,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2053/500000] + train/ActionNoiseL2Loss=0.1275 + throughput/total_tokens=394,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2054/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=394,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2055/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=394,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2056/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=394,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2057/500000] + train/ActionNoiseL2Loss=0.1588 + throughput/total_tokens=394,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2058/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=395,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2059/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=395,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2060/500000] + optim/total_grad_norm=1.623 + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=395,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2061/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=395,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2062/500000] + train/ActionNoiseL2Loss=0.1285 + throughput/total_tokens=395,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2063/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=396,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2064/500000] + train/ActionNoiseL2Loss=0.1189 + throughput/total_tokens=396,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2065/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=396,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2066/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=396,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2067/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=396,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2068/500000] + train/ActionNoiseL2Loss=0.1253 + throughput/total_tokens=397,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2069/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=397,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2070/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=397,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2071/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=397,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2072/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=397,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2073/500000] + train/ActionNoiseL2Loss=0.1290 + throughput/total_tokens=398,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2074/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=398,208,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2075/500000] + train/ActionNoiseL2Loss=0.1304 + throughput/total_tokens=398,400,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2076/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=398,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2077/500000] + train/ActionNoiseL2Loss=0.1332 + throughput/total_tokens=398,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2078/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=398,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2079/500000] + train/ActionNoiseL2Loss=0.1403 + throughput/total_tokens=399,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2080/500000] + optim/total_grad_norm=1.626 + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=399,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2081/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=399,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2082/500000] + train/ActionNoiseL2Loss=0.1709 + throughput/total_tokens=399,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2083/500000] + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=399,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2084/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=400,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2085/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=400,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2086/500000] + train/ActionNoiseL2Loss=0.1133 + throughput/total_tokens=400,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2087/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=400,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2088/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=400,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2089/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=401,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2090/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=401,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2091/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=401,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2092/500000] + train/ActionNoiseL2Loss=0.1137 + throughput/total_tokens=401,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2093/500000] + train/ActionNoiseL2Loss=0.1634 + throughput/total_tokens=401,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2094/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=402,048,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2095/500000] + train/ActionNoiseL2Loss=0.1177 + throughput/total_tokens=402,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2096/500000] + train/ActionNoiseL2Loss=0.1302 + throughput/total_tokens=402,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2097/500000] + train/ActionNoiseL2Loss=0.1166 + throughput/total_tokens=402,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2098/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=402,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2099/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=403,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2100/500000] + optim/total_grad_norm=1.154 + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=403,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2101/500000] + train/ActionNoiseL2Loss=0.1479 + throughput/total_tokens=403,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2102/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=403,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2103/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=403,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2104/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=403,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2105/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=404,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2106/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=404,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2107/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=404,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2108/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=404,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2109/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=404,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2110/500000] + train/ActionNoiseL2Loss=0.1394 + throughput/total_tokens=405,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2111/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=405,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2112/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=405,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2113/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=405,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2114/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=405,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2115/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=406,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2116/500000] + train/ActionNoiseL2Loss=0.1323 + throughput/total_tokens=406,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2117/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=406,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2118/500000] + train/ActionNoiseL2Loss=0.1340 + throughput/total_tokens=406,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2119/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=406,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2120/500000] + optim/total_grad_norm=1.624 + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=407,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2121/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=407,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2122/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=407,424,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2123/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=407,616,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2124/500000] + train/ActionNoiseL2Loss=0.1128 + throughput/total_tokens=407,808,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2125/500000] + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=408,000,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2126/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=408,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2127/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=408,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2128/500000] + train/ActionNoiseL2Loss=0.1210 + throughput/total_tokens=408,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2129/500000] + train/ActionNoiseL2Loss=0.1312 + throughput/total_tokens=408,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2130/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=408,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2131/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=409,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2132/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=409,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2133/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=409,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2134/500000] + train/ActionNoiseL2Loss=0.1584 + throughput/total_tokens=409,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2135/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=409,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2136/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=410,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2137/500000] + train/ActionNoiseL2Loss=0.1210 + throughput/total_tokens=410,304,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2138/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=410,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2139/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=410,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2140/500000] + optim/total_grad_norm=2.733 + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=410,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2141/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=411,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2142/500000] + train/ActionNoiseL2Loss=0.1270 + throughput/total_tokens=411,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2143/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=411,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2144/500000] + train/ActionNoiseL2Loss=0.1499 + throughput/total_tokens=411,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2145/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=411,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2146/500000] + train/ActionNoiseL2Loss=0.0948 + throughput/total_tokens=412,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2147/500000] + train/ActionNoiseL2Loss=0.1186 + throughput/total_tokens=412,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2148/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=412,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2149/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=412,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2150/500000] + train/ActionNoiseL2Loss=0.1982 + throughput/total_tokens=412,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2151/500000] + train/ActionNoiseL2Loss=0.1525 + throughput/total_tokens=412,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2152/500000] + train/ActionNoiseL2Loss=0.1535 + throughput/total_tokens=413,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2153/500000] + train/ActionNoiseL2Loss=0.1304 + throughput/total_tokens=413,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2154/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=413,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2155/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=413,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2156/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=413,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2157/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=414,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2158/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=414,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2159/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=414,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2160/500000] + optim/total_grad_norm=1.674 + train/ActionNoiseL2Loss=0.1287 + throughput/total_tokens=414,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2161/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=414,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2162/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=415,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2163/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=415,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2164/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=415,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2165/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=415,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2166/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=415,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2167/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=416,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2168/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=416,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2169/500000] + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=416,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2170/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=416,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2171/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=416,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2172/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=417,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2173/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=417,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2174/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=417,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2175/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=417,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2176/500000] + train/ActionNoiseL2Loss=0.1189 + throughput/total_tokens=417,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2177/500000] + train/ActionNoiseL2Loss=0.1661 + throughput/total_tokens=417,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2178/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=418,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2179/500000] + train/ActionNoiseL2Loss=0.1726 + throughput/total_tokens=418,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2180/500000] + optim/total_grad_norm=1.258 + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=418,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2181/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=418,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2182/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=418,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2183/500000] + train/ActionNoiseL2Loss=0.1551 + throughput/total_tokens=419,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2184/500000] + train/ActionNoiseL2Loss=0.1098 + throughput/total_tokens=419,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2185/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=419,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2186/500000] + train/ActionNoiseL2Loss=0.1118 + throughput/total_tokens=419,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2187/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=419,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2188/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=420,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2189/500000] + train/ActionNoiseL2Loss=0.1018 + throughput/total_tokens=420,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2190/500000] + train/ActionNoiseL2Loss=0.1440 + throughput/total_tokens=420,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2191/500000] + train/ActionNoiseL2Loss=0.1179 + throughput/total_tokens=420,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2192/500000] + train/ActionNoiseL2Loss=0.1529 + throughput/total_tokens=420,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2193/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=421,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2194/500000] + train/ActionNoiseL2Loss=0.1795 + throughput/total_tokens=421,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2195/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=421,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2196/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=421,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2197/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=421,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2198/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=422,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2199/500000] + train/ActionNoiseL2Loss=0.1215 + throughput/total_tokens=422,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2200/500000] + optim/total_grad_norm=1.391 + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=422,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2201/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=422,592,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2202/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=422,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2203/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=422,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2204/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=423,168,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2205/500000] + train/ActionNoiseL2Loss=0.1897 + throughput/total_tokens=423,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2206/500000] + train/ActionNoiseL2Loss=0.1379 + throughput/total_tokens=423,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2207/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=423,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2208/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=423,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2209/500000] + train/ActionNoiseL2Loss=0.1428 + throughput/total_tokens=424,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2210/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=424,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=2211/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=424,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2212/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=424,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2213/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=424,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2214/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=425,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2215/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=425,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2216/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=425,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2217/500000] + train/ActionNoiseL2Loss=0.1346 + throughput/total_tokens=425,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2218/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=425,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2219/500000] + train/ActionNoiseL2Loss=0.1708 + throughput/total_tokens=426,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2220/500000] + optim/total_grad_norm=2.099 + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=426,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2221/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=426,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2222/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=426,624,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2223/500000] + train/ActionNoiseL2Loss=0.1741 + throughput/total_tokens=426,816,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2224/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=427,008,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2225/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=427,200,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2226/500000] + train/ActionNoiseL2Loss=0.1630 + throughput/total_tokens=427,392,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2227/500000] + train/ActionNoiseL2Loss=0.1292 + throughput/total_tokens=427,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2228/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=427,776,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2229/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=427,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2230/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=428,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=2231/500000] + train/ActionNoiseL2Loss=0.1251 + throughput/total_tokens=428,352,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2232/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=428,544,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2233/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=428,736,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2234/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=428,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2235/500000] + train/ActionNoiseL2Loss=0.1694 + throughput/total_tokens=429,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2236/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=429,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2237/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=429,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2238/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=429,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2239/500000] + train/ActionNoiseL2Loss=0.1334 + throughput/total_tokens=429,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2240/500000] + optim/total_grad_norm=2.425 + train/ActionNoiseL2Loss=0.1276 + throughput/total_tokens=430,080,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2241/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=430,272,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2242/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=430,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2243/500000] + train/ActionNoiseL2Loss=0.1134 + throughput/total_tokens=430,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2244/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=430,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2245/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=431,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2246/500000] + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=431,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2247/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=431,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2248/500000] + train/ActionNoiseL2Loss=0.1111 + throughput/total_tokens=431,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2249/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=431,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2250/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=432,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2251/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=432,192,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2252/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=432,384,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2253/500000] + train/ActionNoiseL2Loss=0.1121 + throughput/total_tokens=432,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2254/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=432,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2255/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=432,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2256/500000] + train/ActionNoiseL2Loss=0.1344 + throughput/total_tokens=433,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2257/500000] + train/ActionNoiseL2Loss=0.1257 + throughput/total_tokens=433,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2258/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=433,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2259/500000] + train/ActionNoiseL2Loss=0.1393 + throughput/total_tokens=433,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2260/500000] + optim/total_grad_norm=0.9670 + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=433,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2261/500000] + train/ActionNoiseL2Loss=0.1545 + throughput/total_tokens=434,112,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2262/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=434,304,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2263/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=434,496,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2264/500000] + train/ActionNoiseL2Loss=0.1814 + throughput/total_tokens=434,688,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2265/500000] + train/ActionNoiseL2Loss=0.1554 + throughput/total_tokens=434,880,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2266/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=435,072,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2267/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=435,264,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2268/500000] + train/ActionNoiseL2Loss=0.1258 + throughput/total_tokens=435,456,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2269/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=435,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2270/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=435,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2271/500000] + train/ActionNoiseL2Loss=0.1249 + throughput/total_tokens=436,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2272/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=436,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2273/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=436,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2274/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=436,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2275/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=436,800,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2276/500000] + train/ActionNoiseL2Loss=0.1200 + throughput/total_tokens=436,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2277/500000] + train/ActionNoiseL2Loss=0.1201 + throughput/total_tokens=437,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2278/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=437,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2279/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=437,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2280/500000] + optim/total_grad_norm=1.446 + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=437,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2281/500000] + train/ActionNoiseL2Loss=0.1447 + throughput/total_tokens=437,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2282/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=438,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2283/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=438,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2284/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=438,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2285/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=438,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2286/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=438,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2287/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=439,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2288/500000] + train/ActionNoiseL2Loss=0.1293 + throughput/total_tokens=439,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2289/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=439,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2290/500000] + train/ActionNoiseL2Loss=0.1222 + throughput/total_tokens=439,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2291/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=439,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2292/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=440,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2293/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=440,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2294/500000] + train/ActionNoiseL2Loss=0.1605 + throughput/total_tokens=440,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2295/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=440,640,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2296/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=440,832,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2297/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=441,024,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2298/500000] + train/ActionNoiseL2Loss=0.1520 + throughput/total_tokens=441,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2299/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=441,408,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2300/500000] + optim/total_grad_norm=2.199 + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=441,600,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2301/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=441,792,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2302/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=441,984,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2303/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=442,176,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=2304/500000] + train/ActionNoiseL2Loss=0.1805 + throughput/total_tokens=442,368,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=2305/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=442,560,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=2306/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=442,752,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2307/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=442,944,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=2308/500000] + train/ActionNoiseL2Loss=0.1197 + throughput/total_tokens=443,136,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=2309/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=443,328,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2310/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=443,520,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,076 +[step=2311/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=443,712,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=2312/500000] + train/ActionNoiseL2Loss=0.1177 + throughput/total_tokens=443,904,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2313/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=444,096,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2314/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=444,288,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2315/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=444,480,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2316/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=444,672,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2317/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=444,864,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2318/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=445,056,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2319/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=445,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2320/500000] + optim/total_grad_norm=1.980 + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=445,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2321/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=445,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2322/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=445,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2323/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=446,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2324/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=446,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2325/500000] + train/ActionNoiseL2Loss=0.1456 + throughput/total_tokens=446,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2326/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=446,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2327/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=446,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2328/500000] + train/ActionNoiseL2Loss=0.1131 + throughput/total_tokens=446,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2329/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=447,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2330/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=447,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2331/500000] + train/ActionNoiseL2Loss=0.1355 + throughput/total_tokens=447,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2332/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=447,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2333/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=447,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2334/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=448,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2335/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=448,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2336/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=448,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2337/500000] + train/ActionNoiseL2Loss=0.1188 + throughput/total_tokens=448,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2338/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=448,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2339/500000] + train/ActionNoiseL2Loss=0.1377 + throughput/total_tokens=449,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2340/500000] + optim/total_grad_norm=1.693 + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=449,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2341/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=449,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2342/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=449,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2343/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=449,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2344/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=450,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2345/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=450,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2346/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=450,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2347/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=450,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2348/500000] + train/ActionNoiseL2Loss=0.1372 + throughput/total_tokens=450,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2349/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=451,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2350/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=451,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2351/500000] + train/ActionNoiseL2Loss=0.1530 + throughput/total_tokens=451,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2352/500000] + train/ActionNoiseL2Loss=0.1199 + throughput/total_tokens=451,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2353/500000] + train/ActionNoiseL2Loss=0.1094 + throughput/total_tokens=451,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2354/500000] + train/ActionNoiseL2Loss=0.1631 + throughput/total_tokens=451,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2355/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=452,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2356/500000] + train/ActionNoiseL2Loss=0.1267 + throughput/total_tokens=452,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2357/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=452,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2358/500000] + train/ActionNoiseL2Loss=0.1213 + throughput/total_tokens=452,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2359/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=452,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2360/500000] + optim/total_grad_norm=2.404 + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=453,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2361/500000] + train/ActionNoiseL2Loss=0.1343 + throughput/total_tokens=453,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2362/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=453,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2363/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=453,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2364/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=453,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2365/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=454,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2366/500000] + train/ActionNoiseL2Loss=0.1352 + throughput/total_tokens=454,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2367/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=454,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2368/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=454,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2369/500000] + train/ActionNoiseL2Loss=0.1184 + throughput/total_tokens=454,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2370/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=455,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2371/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=455,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2372/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=455,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2373/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=455,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2374/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=455,808,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2375/500000] + train/ActionNoiseL2Loss=0.1715 + throughput/total_tokens=456,000,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2376/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=456,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2377/500000] + train/ActionNoiseL2Loss=0.1499 + throughput/total_tokens=456,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2378/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=456,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2379/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=456,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2380/500000] + optim/total_grad_norm=0.8900 + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=456,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2381/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=457,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2382/500000] + train/ActionNoiseL2Loss=0.1112 + throughput/total_tokens=457,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2383/500000] + train/ActionNoiseL2Loss=0.1422 + throughput/total_tokens=457,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2384/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=457,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2385/500000] + train/ActionNoiseL2Loss=0.1571 + throughput/total_tokens=457,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2386/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=458,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2387/500000] + train/ActionNoiseL2Loss=0.1274 + throughput/total_tokens=458,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2388/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=458,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2389/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=458,688,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2390/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=458,880,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=2391/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=459,072,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2392/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=459,264,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2393/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=459,456,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2394/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=459,648,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2395/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=459,840,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2396/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=460,032,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2397/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=460,224,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2398/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=460,416,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2399/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=460,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2400/500000] + optim/total_grad_norm=1.442 + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=460,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=2401/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=460,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2402/500000] + train/ActionNoiseL2Loss=0.1355 + throughput/total_tokens=461,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2403/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=461,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2404/500000] + train/ActionNoiseL2Loss=0.1136 + throughput/total_tokens=461,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2405/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=461,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2406/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=461,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2407/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=462,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2408/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=462,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2409/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=462,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2410/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=462,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2411/500000] + train/ActionNoiseL2Loss=0.1366 + throughput/total_tokens=462,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2412/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=463,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2413/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=463,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2414/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=463,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2415/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=463,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2416/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=463,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2417/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=464,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2418/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=464,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2419/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=464,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2420/500000] + optim/total_grad_norm=1.975 + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=464,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2421/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=464,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2422/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=465,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2423/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=465,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2424/500000] + train/ActionNoiseL2Loss=0.1176 + throughput/total_tokens=465,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2425/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=465,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2426/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=465,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2427/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=465,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2428/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=466,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2429/500000] + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=466,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2430/500000] + train/ActionNoiseL2Loss=0.1894 + throughput/total_tokens=466,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2431/500000] + train/ActionNoiseL2Loss=0.1256 + throughput/total_tokens=466,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2432/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=466,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2433/500000] + train/ActionNoiseL2Loss=0.1306 + throughput/total_tokens=467,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2434/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=467,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2435/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=467,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2436/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=467,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2437/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=467,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2438/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=468,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2439/500000] + train/ActionNoiseL2Loss=0.1202 + throughput/total_tokens=468,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2440/500000] + optim/total_grad_norm=1.135 + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=468,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2441/500000] + train/ActionNoiseL2Loss=0.0982 + throughput/total_tokens=468,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2442/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=468,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2443/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=469,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2444/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=469,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2445/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=469,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2446/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=469,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2447/500000] + train/ActionNoiseL2Loss=0.1368 + throughput/total_tokens=469,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2448/500000] + train/ActionNoiseL2Loss=0.1291 + throughput/total_tokens=470,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2449/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=470,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2450/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=470,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=2451/500000] + train/ActionNoiseL2Loss=0.1342 + throughput/total_tokens=470,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2452/500000] + train/ActionNoiseL2Loss=0.0971 + throughput/total_tokens=470,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2453/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=470,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2454/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=471,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2455/500000] + train/ActionNoiseL2Loss=0.1292 + throughput/total_tokens=471,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2456/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=471,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2457/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=471,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2458/500000] + train/ActionNoiseL2Loss=0.1449 + throughput/total_tokens=471,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2459/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=472,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2460/500000] + optim/total_grad_norm=2.075 + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=472,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2461/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=472,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2462/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=472,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2463/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=472,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2464/500000] + train/ActionNoiseL2Loss=0.1589 + throughput/total_tokens=473,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2465/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=473,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2466/500000] + train/ActionNoiseL2Loss=0.1484 + throughput/total_tokens=473,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2467/500000] + train/ActionNoiseL2Loss=0.1249 + throughput/total_tokens=473,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2468/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=473,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2469/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=474,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2470/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=474,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2471/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=474,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2472/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=474,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2473/500000] + train/ActionNoiseL2Loss=0.1255 + throughput/total_tokens=474,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2474/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=475,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2475/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=475,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2476/500000] + train/ActionNoiseL2Loss=0.1184 + throughput/total_tokens=475,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2477/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=475,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2478/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=475,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2479/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=475,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2480/500000] + optim/total_grad_norm=1.053 + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=476,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2481/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=476,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2482/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=476,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2483/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=476,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2484/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=476,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2485/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=477,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2486/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=477,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2487/500000] + train/ActionNoiseL2Loss=0.1026 + throughput/total_tokens=477,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2488/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=477,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2489/500000] + train/ActionNoiseL2Loss=0.1115 + throughput/total_tokens=477,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2490/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=478,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2491/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=478,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2492/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=478,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2493/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=478,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2494/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=478,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2495/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=479,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2496/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=479,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2497/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=479,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2498/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=479,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2499/500000] + train/ActionNoiseL2Loss=0.1195 + throughput/total_tokens=479,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2500/500000] + optim/total_grad_norm=1.782 + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=480,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +10/12 [07:32:13] INFO | >> Saving config... checkpoint.py:608 +10/12 [07:32:46] INFO | >> Saving model state... checkpoint.py:796 +10/12 [07:33:58] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [07:35:28] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=2501/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=480,192,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=2502/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=480,384,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2503/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=480,576,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=2504/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=480,768,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=2505/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=480,960,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=2506/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=481,152,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2507/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=481,344,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2508/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=481,536,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2509/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=481,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2510/500000] + train/ActionNoiseL2Loss=0.1105 + throughput/total_tokens=481,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2511/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=482,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2512/500000] + train/ActionNoiseL2Loss=0.1316 + throughput/total_tokens=482,304,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2513/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=482,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2514/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=482,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2515/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=482,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2516/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=483,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2517/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=483,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2518/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=483,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2519/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=483,648,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2520/500000] + optim/total_grad_norm=1.324 + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=483,840,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2521/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=484,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2522/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=484,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2523/500000] + train/ActionNoiseL2Loss=0.1388 + throughput/total_tokens=484,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2524/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=484,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2525/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=484,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2526/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=484,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2527/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=485,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2528/500000] + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=485,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2529/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=485,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2530/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=485,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2531/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=485,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2532/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=486,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2533/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=486,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2534/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=486,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2535/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=486,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2536/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=486,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2537/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=487,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2538/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=487,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2539/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=487,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2540/500000] + optim/total_grad_norm=1.728 + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=487,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2541/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=487,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2542/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=488,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2543/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=488,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2544/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=488,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2545/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=488,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2546/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=488,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2547/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=489,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2548/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=489,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2549/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=489,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2550/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=489,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2551/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=489,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2552/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=489,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2553/500000] + train/ActionNoiseL2Loss=0.1399 + throughput/total_tokens=490,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2554/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=490,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2555/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=490,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2556/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=490,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2557/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=490,944,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2558/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=491,136,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2559/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=491,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2560/500000] + optim/total_grad_norm=1.218 + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=491,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=2561/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=491,712,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2562/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=491,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2563/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=492,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2564/500000] + train/ActionNoiseL2Loss=0.1250 + throughput/total_tokens=492,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2565/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=492,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2566/500000] + train/ActionNoiseL2Loss=0.1904 + throughput/total_tokens=492,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2567/500000] + train/ActionNoiseL2Loss=0.1181 + throughput/total_tokens=492,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2568/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=493,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2569/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=493,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2570/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=493,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2571/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=493,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2572/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=493,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2573/500000] + train/ActionNoiseL2Loss=0.1547 + throughput/total_tokens=494,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2574/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=494,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2575/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=494,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2576/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=494,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2577/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=494,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2578/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=494,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2579/500000] + train/ActionNoiseL2Loss=0.1112 + throughput/total_tokens=495,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2580/500000] + optim/total_grad_norm=1.722 + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=495,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2581/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=495,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2582/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=495,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2583/500000] + train/ActionNoiseL2Loss=0.0979 + throughput/total_tokens=495,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2584/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=496,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2585/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=496,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2586/500000] + train/ActionNoiseL2Loss=0.1205 + throughput/total_tokens=496,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2587/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=496,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2588/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=496,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2589/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=497,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2590/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=497,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2591/500000] + train/ActionNoiseL2Loss=0.1165 + throughput/total_tokens=497,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2592/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=497,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2593/500000] + train/ActionNoiseL2Loss=0.1154 + throughput/total_tokens=497,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2594/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=498,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2595/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=498,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2596/500000] + train/ActionNoiseL2Loss=0.1136 + throughput/total_tokens=498,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2597/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=498,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2598/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=498,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2599/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=499,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2600/500000] + optim/total_grad_norm=2.257 + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=499,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2601/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=499,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2602/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=499,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2603/500000] + train/ActionNoiseL2Loss=0.1568 + throughput/total_tokens=499,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2604/500000] + train/ActionNoiseL2Loss=0.1151 + throughput/total_tokens=499,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2605/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=500,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2606/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=500,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2607/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=500,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2608/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=500,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2609/500000] + train/ActionNoiseL2Loss=0.1372 + throughput/total_tokens=500,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2610/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=501,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2611/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=501,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2612/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=501,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2613/500000] + train/ActionNoiseL2Loss=0.1363 + throughput/total_tokens=501,696,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2614/500000] + train/ActionNoiseL2Loss=0.1561 + throughput/total_tokens=501,888,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2615/500000] + train/ActionNoiseL2Loss=0.1118 + throughput/total_tokens=502,080,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2616/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=502,272,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2617/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=502,464,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2618/500000] + train/ActionNoiseL2Loss=0.1190 + throughput/total_tokens=502,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2619/500000] + train/ActionNoiseL2Loss=0.1055 + throughput/total_tokens=502,848,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2620/500000] + optim/total_grad_norm=1.736 + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=503,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=2621/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=503,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2622/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=503,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2623/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=503,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2624/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=503,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2625/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=504,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2626/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=504,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2627/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=504,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2628/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=504,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2629/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=504,768,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2630/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=504,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=2631/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=505,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2632/500000] + train/ActionNoiseL2Loss=0.1269 + throughput/total_tokens=505,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2633/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=505,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2634/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=505,728,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2635/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=505,920,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2636/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=506,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2637/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=506,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2638/500000] + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=506,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2639/500000] + train/ActionNoiseL2Loss=0.1392 + throughput/total_tokens=506,688,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2640/500000] + optim/total_grad_norm=1.704 + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=506,880,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=2641/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=507,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2642/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=507,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2643/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=507,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2644/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=507,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2645/500000] + train/ActionNoiseL2Loss=0.1127 + throughput/total_tokens=507,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2646/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=508,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2647/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=508,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2648/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=508,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2649/500000] + train/ActionNoiseL2Loss=0.1116 + throughput/total_tokens=508,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2650/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=508,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2651/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=508,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2652/500000] + train/ActionNoiseL2Loss=0.1375 + throughput/total_tokens=509,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2653/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=509,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2654/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=509,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2655/500000] + train/ActionNoiseL2Loss=0.1367 + throughput/total_tokens=509,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2656/500000] + train/ActionNoiseL2Loss=0.1059 + throughput/total_tokens=509,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2657/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=510,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2658/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=510,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2659/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=510,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2660/500000] + optim/total_grad_norm=1.296 + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=510,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2661/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=510,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2662/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=511,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2663/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=511,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2664/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=511,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2665/500000] + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=511,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2666/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=511,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2667/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=512,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2668/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=512,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2669/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=512,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2670/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=512,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2671/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=512,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2672/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=513,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2673/500000] + train/ActionNoiseL2Loss=0.1433 + throughput/total_tokens=513,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2674/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=513,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2675/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=513,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2676/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=513,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2677/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=513,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2678/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=514,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2679/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=514,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2680/500000] + optim/total_grad_norm=1.828 + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=514,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2681/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=514,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2682/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=514,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2683/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=515,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2684/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=515,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2685/500000] + train/ActionNoiseL2Loss=0.1296 + throughput/total_tokens=515,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2686/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=515,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2687/500000] + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=515,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2688/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=516,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2689/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=516,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2690/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=516,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2691/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=516,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2692/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=516,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2693/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=517,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2694/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=517,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2695/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=517,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2696/500000] + train/ActionNoiseL2Loss=0.1564 + throughput/total_tokens=517,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2697/500000] + train/ActionNoiseL2Loss=0.0972 + throughput/total_tokens=517,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2698/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=518,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2699/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=518,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2700/500000] + optim/total_grad_norm=1.308 + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=518,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2701/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=518,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2702/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=518,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2703/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=518,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2704/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=519,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2705/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=519,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2706/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=519,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2707/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=519,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2708/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=519,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2709/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=520,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2710/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=520,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2711/500000] + train/ActionNoiseL2Loss=0.1144 + throughput/total_tokens=520,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2712/500000] + train/ActionNoiseL2Loss=0.1579 + throughput/total_tokens=520,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2713/500000] + train/ActionNoiseL2Loss=0.1403 + throughput/total_tokens=520,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2714/500000] + train/ActionNoiseL2Loss=0.1628 + throughput/total_tokens=521,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2715/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=521,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2716/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=521,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2717/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=521,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2718/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=521,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2719/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=522,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2720/500000] + optim/total_grad_norm=1.756 + train/ActionNoiseL2Loss=0.1684 + throughput/total_tokens=522,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2721/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=522,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2722/500000] + train/ActionNoiseL2Loss=0.1239 + throughput/total_tokens=522,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2723/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=522,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2724/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=523,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2725/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=523,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2726/500000] + train/ActionNoiseL2Loss=0.1122 + throughput/total_tokens=523,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2727/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=523,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2728/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=523,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2729/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=523,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2730/500000] + train/ActionNoiseL2Loss=0.1449 + throughput/total_tokens=524,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2731/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=524,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2732/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=524,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2733/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=524,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2734/500000] + train/ActionNoiseL2Loss=0.1420 + throughput/total_tokens=524,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2735/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=525,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2736/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=525,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2737/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=525,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2738/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=525,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2739/500000] + train/ActionNoiseL2Loss=0.1253 + throughput/total_tokens=525,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2740/500000] + optim/total_grad_norm=1.176 + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=526,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2741/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=526,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2742/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=526,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2743/500000] + train/ActionNoiseL2Loss=0.1221 + throughput/total_tokens=526,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2744/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=526,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2745/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=527,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2746/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=527,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2747/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=527,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2748/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=527,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2749/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=527,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2750/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=528,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2751/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=528,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2752/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=528,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2753/500000] + train/ActionNoiseL2Loss=0.0996 + throughput/total_tokens=528,576,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2754/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=528,768,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2755/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=528,960,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2756/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=529,152,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2757/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=529,344,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2758/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=529,536,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=2759/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=529,728,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2760/500000] + optim/total_grad_norm=1.646 + train/ActionNoiseL2Loss=0.1141 + throughput/total_tokens=529,920,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=2761/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=530,112,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2762/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=530,304,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2763/500000] + train/ActionNoiseL2Loss=0.1587 + throughput/total_tokens=530,496,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=2764/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=530,688,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2765/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=530,880,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2766/500000] + train/ActionNoiseL2Loss=0.1287 + throughput/total_tokens=531,072,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2767/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=531,264,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2768/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=531,456,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2769/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=531,648,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=2770/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=531,840,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2771/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=532,032,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2772/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=532,224,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2773/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=532,416,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2774/500000] + train/ActionNoiseL2Loss=0.1251 + throughput/total_tokens=532,608,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2775/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=532,800,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2776/500000] + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=532,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2777/500000] + train/ActionNoiseL2Loss=0.1022 + throughput/total_tokens=533,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2778/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=533,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2779/500000] + train/ActionNoiseL2Loss=0.1178 + throughput/total_tokens=533,568,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2780/500000] + optim/total_grad_norm=1.758 + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=533,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2781/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=533,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2782/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=534,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2783/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=534,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2784/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=534,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2785/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=534,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2786/500000] + train/ActionNoiseL2Loss=0.1208 + throughput/total_tokens=534,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2787/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=535,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2788/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=535,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2789/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=535,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2790/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=535,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2791/500000] + train/ActionNoiseL2Loss=0.1234 + throughput/total_tokens=535,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2792/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=536,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2793/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=536,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2794/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=536,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2795/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=536,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2796/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=536,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2797/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=537,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2798/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=537,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2799/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=537,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2800/500000] + optim/total_grad_norm=1.744 + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=537,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2801/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=537,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2802/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=537,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2803/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=538,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2804/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=538,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2805/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=538,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2806/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=538,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2807/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=538,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2808/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=539,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2809/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=539,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2810/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=539,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2811/500000] + train/ActionNoiseL2Loss=0.1200 + throughput/total_tokens=539,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2812/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=539,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2813/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=540,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2814/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=540,288,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2815/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=540,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2816/500000] + train/ActionNoiseL2Loss=0.1361 + throughput/total_tokens=540,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2817/500000] + train/ActionNoiseL2Loss=0.1404 + throughput/total_tokens=540,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2818/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=541,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2819/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=541,248,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2820/500000] + optim/total_grad_norm=0.9401 + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=541,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=2821/500000] + train/ActionNoiseL2Loss=0.1413 + throughput/total_tokens=541,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2822/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=541,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2823/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=542,016,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=2824/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=542,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2825/500000] + train/ActionNoiseL2Loss=0.1580 + throughput/total_tokens=542,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2826/500000] + train/ActionNoiseL2Loss=0.1070 + throughput/total_tokens=542,592,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2827/500000] + train/ActionNoiseL2Loss=0.1428 + throughput/total_tokens=542,784,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2828/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=542,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2829/500000] + train/ActionNoiseL2Loss=0.1700 + throughput/total_tokens=543,168,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2830/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=543,360,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=2831/500000] + train/ActionNoiseL2Loss=0.1304 + throughput/total_tokens=543,552,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2832/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=543,744,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2833/500000] + train/ActionNoiseL2Loss=0.1103 + throughput/total_tokens=543,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2834/500000] + train/ActionNoiseL2Loss=0.1587 + throughput/total_tokens=544,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2835/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=544,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2836/500000] + train/ActionNoiseL2Loss=0.1369 + throughput/total_tokens=544,512,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2837/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=544,704,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2838/500000] + train/ActionNoiseL2Loss=0.1158 + throughput/total_tokens=544,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2839/500000] + train/ActionNoiseL2Loss=0.1107 + throughput/total_tokens=545,088,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2840/500000] + optim/total_grad_norm=2.050 + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=545,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=2841/500000] + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=545,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2842/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=545,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2843/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=545,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2844/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=546,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2845/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=546,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2846/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=546,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2847/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=546,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2848/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=546,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2849/500000] + train/ActionNoiseL2Loss=0.1645 + throughput/total_tokens=547,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2850/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=547,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2851/500000] + train/ActionNoiseL2Loss=0.0972 + throughput/total_tokens=547,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2852/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=547,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2853/500000] + train/ActionNoiseL2Loss=0.1243 + throughput/total_tokens=547,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2854/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=547,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2855/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=548,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2856/500000] + train/ActionNoiseL2Loss=0.1257 + throughput/total_tokens=548,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2857/500000] + train/ActionNoiseL2Loss=0.1018 + throughput/total_tokens=548,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2858/500000] + train/ActionNoiseL2Loss=0.1171 + throughput/total_tokens=548,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2859/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=548,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2860/500000] + optim/total_grad_norm=1.486 + train/ActionNoiseL2Loss=0.1121 + throughput/total_tokens=549,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2861/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=549,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2862/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=549,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2863/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=549,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2864/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=549,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2865/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=550,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2866/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=550,272,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2867/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=550,464,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2868/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=550,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2869/500000] + train/ActionNoiseL2Loss=0.1447 + throughput/total_tokens=550,848,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2870/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=551,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2871/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=551,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2872/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=551,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2873/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=551,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2874/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=551,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2875/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=552,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2876/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=552,192,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2877/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=552,384,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2878/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=552,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2879/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=552,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2880/500000] + optim/total_grad_norm=0.8975 + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=552,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2881/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=553,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2882/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=553,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2883/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=553,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2884/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=553,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2885/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=553,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2886/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=554,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2887/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=554,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2888/500000] + train/ActionNoiseL2Loss=0.1446 + throughput/total_tokens=554,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2889/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=554,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2890/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=554,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2891/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=555,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2892/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=555,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2893/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=555,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2894/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=555,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2895/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=555,840,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2896/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=556,032,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2897/500000] + train/ActionNoiseL2Loss=0.1345 + throughput/total_tokens=556,224,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2898/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=556,416,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2899/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=556,608,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2900/500000] + optim/total_grad_norm=1.415 + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=556,800,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2901/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=556,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2902/500000] + train/ActionNoiseL2Loss=0.1123 + throughput/total_tokens=557,184,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2903/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=557,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=2904/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=557,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2905/500000] + train/ActionNoiseL2Loss=0.1478 + throughput/total_tokens=557,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2906/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=557,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2907/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=558,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2908/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=558,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2909/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=558,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2910/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=558,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=2911/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=558,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2912/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=559,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2913/500000] + train/ActionNoiseL2Loss=0.1209 + throughput/total_tokens=559,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2914/500000] + train/ActionNoiseL2Loss=0.1288 + throughput/total_tokens=559,488,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2915/500000] + train/ActionNoiseL2Loss=0.1116 + throughput/total_tokens=559,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2916/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=559,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2917/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=560,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=2918/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=560,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2919/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=560,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=2920/500000] + optim/total_grad_norm=1.433 + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=560,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2921/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=560,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2922/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=561,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2923/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=561,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2924/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=561,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2925/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=561,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2926/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=561,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2927/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=561,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2928/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=562,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2929/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=562,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2930/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=562,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2931/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=562,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2932/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=562,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2933/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=563,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2934/500000] + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=563,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2935/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=563,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2936/500000] + train/ActionNoiseL2Loss=0.1417 + throughput/total_tokens=563,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2937/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=563,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2938/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=564,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2939/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=564,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2940/500000] + optim/total_grad_norm=1.404 + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=564,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2941/500000] + train/ActionNoiseL2Loss=0.1632 + throughput/total_tokens=564,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2942/500000] + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=564,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2943/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=565,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2944/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=565,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2945/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=565,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2946/500000] + train/ActionNoiseL2Loss=0.1255 + throughput/total_tokens=565,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2947/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=565,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2948/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=566,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=2949/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=566,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=2950/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=566,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2951/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=566,592,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2952/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=566,784,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2953/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=566,976,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2954/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=567,168,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2955/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=567,360,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2956/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=567,552,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2957/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=567,744,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2958/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=567,936,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2959/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=568,128,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2960/500000] + optim/total_grad_norm=1.009 + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=568,320,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 + System/Peak GPU Memory (MB)=51,076 +[step=2961/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=568,512,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2962/500000] + train/ActionNoiseL2Loss=0.1170 + throughput/total_tokens=568,704,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=2963/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=568,896,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=2964/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=569,088,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2965/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=569,280,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=2966/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=569,472,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=2967/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=569,664,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2968/500000] + train/ActionNoiseL2Loss=0.1105 + throughput/total_tokens=569,856,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=2969/500000] + train/ActionNoiseL2Loss=0.1286 + throughput/total_tokens=570,048,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=2970/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=570,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2971/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=570,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=2972/500000] + train/ActionNoiseL2Loss=0.1239 + throughput/total_tokens=570,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2973/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=570,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2974/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=571,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2975/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=571,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2976/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=571,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2977/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=571,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2978/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=571,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2979/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=571,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2980/500000] + optim/total_grad_norm=1.508 + train/ActionNoiseL2Loss=0.1134 + throughput/total_tokens=572,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2981/500000] + train/ActionNoiseL2Loss=0.1156 + throughput/total_tokens=572,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2982/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=572,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2983/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=572,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2984/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=572,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2985/500000] + train/ActionNoiseL2Loss=0.1345 + throughput/total_tokens=573,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2986/500000] + train/ActionNoiseL2Loss=0.1229 + throughput/total_tokens=573,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2987/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=573,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2988/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=573,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2989/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=573,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2990/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=574,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=2991/500000] + train/ActionNoiseL2Loss=0.1211 + throughput/total_tokens=574,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2992/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=574,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2993/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=574,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=2994/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=574,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2995/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=575,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=2996/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=575,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2997/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=575,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2998/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=575,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=2999/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=575,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3000/500000] + optim/total_grad_norm=2.332 + train/ActionNoiseL2Loss=0.1312 + throughput/total_tokens=576,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/12 [10:31:32] INFO | >> Saving config... checkpoint.py:608 +10/12 [10:32:04] INFO | >> Saving model state... checkpoint.py:796 +10/12 [10:33:21] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [10:34:54] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=3001/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=576,192,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3002/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=576,384,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=3003/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=576,576,000 + throughput/device/tokens_per_second=1,117 + throughput/device/batches_per_second=0.0465 +[step=3004/500000] + train/ActionNoiseL2Loss=0.0971 + throughput/total_tokens=576,768,000 + throughput/device/tokens_per_second=1,124 + throughput/device/batches_per_second=0.0469 +[step=3005/500000] + train/ActionNoiseL2Loss=0.1098 + throughput/total_tokens=576,960,000 + throughput/device/tokens_per_second=1,130 + throughput/device/batches_per_second=0.0471 +[step=3006/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=577,152,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=3007/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=577,344,000 + throughput/device/tokens_per_second=1,136 + throughput/device/batches_per_second=0.0474 +[step=3008/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=577,536,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0475 +[step=3009/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=577,728,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=3010/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=577,920,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,076 +[step=3011/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=578,112,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=3012/500000] + train/ActionNoiseL2Loss=0.1378 + throughput/total_tokens=578,304,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=3013/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=578,496,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=3014/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=578,688,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=3015/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=578,880,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=3016/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=579,072,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3017/500000] + train/ActionNoiseL2Loss=0.1096 + throughput/total_tokens=579,264,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3018/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=579,456,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3019/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=579,648,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3020/500000] + optim/total_grad_norm=2.184 + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=579,840,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=3021/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=580,032,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3022/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=580,224,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3023/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=580,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3024/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=580,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3025/500000] + train/ActionNoiseL2Loss=0.1186 + throughput/total_tokens=580,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3026/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=580,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3027/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=581,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3028/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=581,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3029/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=581,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3030/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=581,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3031/500000] + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=581,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3032/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=582,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3033/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=582,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3034/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=582,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3035/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=582,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3036/500000] + train/ActionNoiseL2Loss=0.1095 + throughput/total_tokens=582,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3037/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=583,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3038/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=583,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3039/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=583,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3040/500000] + optim/total_grad_norm=1.338 + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=583,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3041/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=583,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3042/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=584,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3043/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=584,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3044/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=584,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3045/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=584,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3046/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=584,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3047/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=585,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3048/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=585,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3049/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=585,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3050/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=585,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3051/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=585,792,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3052/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=585,984,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3053/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=586,176,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3054/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=586,368,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3055/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=586,560,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3056/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=586,752,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3057/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=586,944,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3058/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=587,136,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3059/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=587,328,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3060/500000] + optim/total_grad_norm=1.479 + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=587,520,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=3061/500000] + train/ActionNoiseL2Loss=0.1258 + throughput/total_tokens=587,712,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3062/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=587,904,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3063/500000] + train/ActionNoiseL2Loss=0.1236 + throughput/total_tokens=588,096,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3064/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=588,288,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3065/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=588,480,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3066/500000] + train/ActionNoiseL2Loss=0.1562 + throughput/total_tokens=588,672,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3067/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=588,864,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3068/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=589,056,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3069/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=589,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3070/500000] + train/ActionNoiseL2Loss=0.1154 + throughput/total_tokens=589,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3071/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=589,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3072/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=589,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3073/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=590,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3074/500000] + train/ActionNoiseL2Loss=0.1494 + throughput/total_tokens=590,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3075/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=590,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3076/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=590,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3077/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=590,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3078/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=590,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3079/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=591,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3080/500000] + optim/total_grad_norm=1.361 + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=591,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3081/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=591,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3082/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=591,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3083/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=591,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3084/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=592,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3085/500000] + train/ActionNoiseL2Loss=0.1383 + throughput/total_tokens=592,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3086/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=592,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3087/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=592,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3088/500000] + train/ActionNoiseL2Loss=0.1002 + throughput/total_tokens=592,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3089/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=593,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3090/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=593,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3091/500000] + train/ActionNoiseL2Loss=0.1493 + throughput/total_tokens=593,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3092/500000] + train/ActionNoiseL2Loss=0.1445 + throughput/total_tokens=593,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3093/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=593,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3094/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=594,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3095/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=594,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3096/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=594,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3097/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=594,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3098/500000] + train/ActionNoiseL2Loss=0.1385 + throughput/total_tokens=594,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3099/500000] + train/ActionNoiseL2Loss=0.1284 + throughput/total_tokens=595,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3100/500000] + optim/total_grad_norm=1.066 + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=595,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3101/500000] + train/ActionNoiseL2Loss=0.1337 + throughput/total_tokens=595,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3102/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=595,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3103/500000] + train/ActionNoiseL2Loss=0.1209 + throughput/total_tokens=595,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3104/500000] + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=595,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3105/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=596,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3106/500000] + train/ActionNoiseL2Loss=0.1252 + throughput/total_tokens=596,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3107/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=596,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3108/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=596,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3109/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=596,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3110/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=597,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3111/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=597,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3112/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=597,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3113/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=597,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3114/500000] + train/ActionNoiseL2Loss=0.1083 + throughput/total_tokens=597,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3115/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=598,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3116/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=598,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3117/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=598,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3118/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=598,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3119/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=598,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3120/500000] + optim/total_grad_norm=1.168 + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=599,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3121/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=599,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3122/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=599,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3123/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=599,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3124/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=599,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3125/500000] + train/ActionNoiseL2Loss=0.1136 + throughput/total_tokens=600,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3126/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=600,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3127/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=600,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3128/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=600,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3129/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=600,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3130/500000] + train/ActionNoiseL2Loss=0.1359 + throughput/total_tokens=600,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3131/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=601,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3132/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=601,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3133/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=601,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3134/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=601,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3135/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=601,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3136/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=602,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3137/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=602,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3138/500000] + train/ActionNoiseL2Loss=0.1381 + throughput/total_tokens=602,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3139/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=602,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3140/500000] + optim/total_grad_norm=1.407 + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=602,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3141/500000] + train/ActionNoiseL2Loss=0.1057 + throughput/total_tokens=603,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3142/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=603,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3143/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=603,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3144/500000] + train/ActionNoiseL2Loss=0.0971 + throughput/total_tokens=603,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3145/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=603,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3146/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=604,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3147/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=604,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3148/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=604,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3149/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=604,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3150/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=604,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3151/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=604,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3152/500000] + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=605,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3153/500000] + train/ActionNoiseL2Loss=0.1448 + throughput/total_tokens=605,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3154/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=605,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3155/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=605,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3156/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=605,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3157/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=606,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3158/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=606,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3159/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=606,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3160/500000] + optim/total_grad_norm=1.346 + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=606,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3161/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=606,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3162/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=607,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3163/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=607,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3164/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=607,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3165/500000] + train/ActionNoiseL2Loss=0.0989 + throughput/total_tokens=607,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3166/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=607,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3167/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=608,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3168/500000] + train/ActionNoiseL2Loss=0.1452 + throughput/total_tokens=608,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3169/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=608,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3170/500000] + train/ActionNoiseL2Loss=0.1114 + throughput/total_tokens=608,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3171/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=608,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3172/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=609,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3173/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=609,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3174/500000] + train/ActionNoiseL2Loss=0.1067 + throughput/total_tokens=609,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3175/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=609,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3176/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=609,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3177/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=609,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3178/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=610,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3179/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=610,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3180/500000] + optim/total_grad_norm=1.821 + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=610,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3181/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=610,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3182/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=610,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3183/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=611,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3184/500000] + train/ActionNoiseL2Loss=0.1232 + throughput/total_tokens=611,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3185/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=611,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3186/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=611,712,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3187/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=611,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3188/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=612,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3189/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=612,288,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3190/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=612,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3191/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=612,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3192/500000] + train/ActionNoiseL2Loss=0.1419 + throughput/total_tokens=612,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3193/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=613,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3194/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=613,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3195/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=613,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3196/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=613,632,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3197/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=613,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3198/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=614,016,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3199/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=614,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3200/500000] + optim/total_grad_norm=1.612 + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=614,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3201/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=614,592,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3202/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=614,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3203/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=614,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3204/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=615,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3205/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=615,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3206/500000] + train/ActionNoiseL2Loss=0.1049 + throughput/total_tokens=615,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3207/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=615,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3208/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=615,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3209/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=616,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3210/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=616,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3211/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=616,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3212/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=616,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3213/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=616,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3214/500000] + train/ActionNoiseL2Loss=0.1500 + throughput/total_tokens=617,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3215/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=617,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3216/500000] + train/ActionNoiseL2Loss=0.1111 + throughput/total_tokens=617,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3217/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=617,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3218/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=617,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3219/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=618,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3220/500000] + optim/total_grad_norm=1.079 + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=618,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3221/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=618,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3222/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=618,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3223/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=618,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3224/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=619,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3225/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=619,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3226/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=619,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3227/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=619,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3228/500000] + train/ActionNoiseL2Loss=0.1339 + throughput/total_tokens=619,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3229/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=619,968,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3230/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=620,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3231/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=620,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3232/500000] + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=620,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3233/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=620,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3234/500000] + train/ActionNoiseL2Loss=0.1678 + throughput/total_tokens=620,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3235/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=621,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3236/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=621,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3237/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=621,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3238/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=621,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3239/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=621,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3240/500000] + optim/total_grad_norm=2.372 + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=622,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3241/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=622,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3242/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=622,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3243/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=622,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3244/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=622,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3245/500000] + train/ActionNoiseL2Loss=0.1133 + throughput/total_tokens=623,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3246/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=623,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3247/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=623,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3248/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=623,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3249/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=623,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3250/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=624,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3251/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=624,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3252/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=624,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3253/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=624,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3254/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=624,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3255/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=624,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3256/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=625,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3257/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=625,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3258/500000] + train/ActionNoiseL2Loss=0.1007 + throughput/total_tokens=625,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3259/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=625,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3260/500000] + optim/total_grad_norm=1.296 + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=625,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3261/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=626,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3262/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=626,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3263/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=626,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3264/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=626,688,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3265/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=626,880,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3266/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=627,072,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3267/500000] + train/ActionNoiseL2Loss=0.1458 + throughput/total_tokens=627,264,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3268/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=627,456,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3269/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=627,648,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3270/500000] + train/ActionNoiseL2Loss=0.1375 + throughput/total_tokens=627,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3271/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=628,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3272/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=628,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3273/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=628,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3274/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=628,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3275/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=628,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3276/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=628,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3277/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=629,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3278/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=629,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3279/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=629,568,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3280/500000] + optim/total_grad_norm=1.569 + train/ActionNoiseL2Loss=0.1266 + throughput/total_tokens=629,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3281/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=629,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3282/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=630,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3283/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=630,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3284/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=630,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3285/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=630,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3286/500000] + train/ActionNoiseL2Loss=0.1473 + throughput/total_tokens=630,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3287/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=631,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3288/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=631,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3289/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=631,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3290/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=631,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3291/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=631,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3292/500000] + train/ActionNoiseL2Loss=0.1162 + throughput/total_tokens=632,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3293/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=632,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3294/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=632,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3295/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=632,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3296/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=632,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3297/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=633,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3298/500000] + train/ActionNoiseL2Loss=0.0929 + throughput/total_tokens=633,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3299/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=633,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3300/500000] + optim/total_grad_norm=1.388 + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=633,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3301/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=633,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3302/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=633,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3303/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=634,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3304/500000] + train/ActionNoiseL2Loss=0.1135 + throughput/total_tokens=634,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3305/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=634,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3306/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=634,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3307/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=634,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3308/500000] + train/ActionNoiseL2Loss=0.1237 + throughput/total_tokens=635,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3309/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=635,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3310/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=635,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3311/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=635,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3312/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=635,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3313/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=636,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3314/500000] + train/ActionNoiseL2Loss=0.1149 + throughput/total_tokens=636,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3315/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=636,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3316/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=636,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3317/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=636,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3318/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=637,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3319/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=637,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3320/500000] + optim/total_grad_norm=1.122 + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=637,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3321/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=637,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3322/500000] + train/ActionNoiseL2Loss=0.1291 + throughput/total_tokens=637,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3323/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=638,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3324/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=638,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3325/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=638,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3326/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=638,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3327/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=638,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3328/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=638,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3329/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=639,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3330/500000] + train/ActionNoiseL2Loss=0.1293 + throughput/total_tokens=639,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3331/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=639,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3332/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=639,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3333/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=639,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3334/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=640,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3335/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=640,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3336/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=640,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3337/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=640,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3338/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=640,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3339/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=641,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3340/500000] + optim/total_grad_norm=0.9450 + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=641,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3341/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=641,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3342/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=641,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3343/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=641,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3344/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=642,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3345/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=642,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3346/500000] + train/ActionNoiseL2Loss=0.1329 + throughput/total_tokens=642,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3347/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=642,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3348/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=642,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3349/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=643,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3350/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=643,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3351/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=643,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3352/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=643,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3353/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=643,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3354/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=643,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3355/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=644,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3356/500000] + train/ActionNoiseL2Loss=0.1066 + throughput/total_tokens=644,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3357/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=644,544,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3358/500000] + train/ActionNoiseL2Loss=0.1331 + throughput/total_tokens=644,736,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3359/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=644,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3360/500000] + optim/total_grad_norm=0.9897 + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=645,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3361/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=645,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3362/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=645,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3363/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=645,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3364/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=645,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3365/500000] + train/ActionNoiseL2Loss=0.1660 + throughput/total_tokens=646,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3366/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=646,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3367/500000] + train/ActionNoiseL2Loss=0.1123 + throughput/total_tokens=646,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3368/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=646,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3369/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=646,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3370/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=647,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3371/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=647,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3372/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=647,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3373/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=647,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3374/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=647,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3375/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=648,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3376/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=648,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3377/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=648,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3378/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=648,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3379/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=648,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3380/500000] + optim/total_grad_norm=1.162 + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=648,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3381/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=649,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3382/500000] + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=649,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3383/500000] + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=649,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3384/500000] + train/ActionNoiseL2Loss=0.1351 + throughput/total_tokens=649,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3385/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=649,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3386/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=650,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3387/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=650,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3388/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=650,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3389/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=650,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3390/500000] + train/ActionNoiseL2Loss=0.1140 + throughput/total_tokens=650,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3391/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=651,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3392/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=651,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3393/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=651,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3394/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=651,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3395/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=651,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3396/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=652,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3397/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=652,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3398/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=652,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3399/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=652,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3400/500000] + optim/total_grad_norm=1.165 + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=652,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3401/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=652,992,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3402/500000] + train/ActionNoiseL2Loss=0.1134 + throughput/total_tokens=653,184,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3403/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=653,376,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3404/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=653,568,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3405/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=653,760,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3406/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=653,952,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3407/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=654,144,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3408/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=654,336,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3409/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=654,528,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=3410/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=654,720,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,076 +[step=3411/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=654,912,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3412/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=655,104,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3413/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=655,296,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=3414/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=655,488,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3415/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=655,680,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=3416/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=655,872,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3417/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=656,064,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3418/500000] + train/ActionNoiseL2Loss=0.1214 + throughput/total_tokens=656,256,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3419/500000] + train/ActionNoiseL2Loss=0.1517 + throughput/total_tokens=656,448,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=3420/500000] + optim/total_grad_norm=1.470 + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=656,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3421/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=656,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3422/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=657,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3423/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=657,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3424/500000] + train/ActionNoiseL2Loss=0.1041 + throughput/total_tokens=657,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3425/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=657,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3426/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=657,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3427/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=657,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3428/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=658,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3429/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=658,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3430/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=658,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3431/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=658,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3432/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=658,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3433/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=659,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3434/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=659,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3435/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=659,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3436/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=659,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3437/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=659,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3438/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=660,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3439/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=660,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3440/500000] + optim/total_grad_norm=1.800 + train/ActionNoiseL2Loss=0.1407 + throughput/total_tokens=660,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3441/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=660,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3442/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=660,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3443/500000] + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=661,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3444/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=661,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3445/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=661,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3446/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=661,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3447/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=661,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3448/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=662,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3449/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=662,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3450/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=662,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3451/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=662,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3452/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=662,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3453/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=662,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3454/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=663,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3455/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=663,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3456/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=663,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3457/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=663,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3458/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=663,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3459/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=664,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3460/500000] + optim/total_grad_norm=1.676 + train/ActionNoiseL2Loss=0.1137 + throughput/total_tokens=664,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=3461/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=664,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3462/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=664,704,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3463/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=664,896,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3464/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=665,088,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3465/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=665,280,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3466/500000] + train/ActionNoiseL2Loss=0.1396 + throughput/total_tokens=665,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3467/500000] + train/ActionNoiseL2Loss=0.1571 + throughput/total_tokens=665,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3468/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=665,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3469/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=666,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3470/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=666,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3471/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=666,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3472/500000] + train/ActionNoiseL2Loss=0.1391 + throughput/total_tokens=666,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3473/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=666,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3474/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=667,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3475/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=667,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3476/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=667,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3477/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=667,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3478/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=667,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3479/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=667,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3480/500000] + optim/total_grad_norm=0.8480 + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=668,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3481/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=668,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3482/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=668,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3483/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=668,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3484/500000] + train/ActionNoiseL2Loss=0.1263 + throughput/total_tokens=668,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3485/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=669,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3486/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=669,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3487/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=669,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3488/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=669,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3489/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=669,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3490/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=670,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3491/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=670,272,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3492/500000] + train/ActionNoiseL2Loss=0.1404 + throughput/total_tokens=670,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3493/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=670,656,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3494/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=670,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3495/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=671,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3496/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=671,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3497/500000] + train/ActionNoiseL2Loss=0.1566 + throughput/total_tokens=671,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3498/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=671,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3499/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=671,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3500/500000] + optim/total_grad_norm=1.038 + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=672,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/12 [13:30:38] INFO | >> Saving config... checkpoint.py:608 +10/12 [13:31:13] INFO | >> Saving model state... checkpoint.py:796 +10/12 [13:32:25] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [13:33:57] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=3501/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=672,192,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=3502/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=672,384,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=3503/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=672,576,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=3504/500000] + train/ActionNoiseL2Loss=0.1229 + throughput/total_tokens=672,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3505/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=672,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3506/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=673,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3507/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=673,344,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3508/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=673,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3509/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=673,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3510/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=673,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3511/500000] + train/ActionNoiseL2Loss=0.1338 + throughput/total_tokens=674,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3512/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=674,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3513/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=674,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3514/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=674,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3515/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=674,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3516/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=675,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3517/500000] + train/ActionNoiseL2Loss=0.1079 + throughput/total_tokens=675,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3518/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=675,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3519/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=675,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3520/500000] + optim/total_grad_norm=1.349 + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=675,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3521/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=676,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3522/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=676,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3523/500000] + train/ActionNoiseL2Loss=0.1281 + throughput/total_tokens=676,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3524/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=676,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3525/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=676,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3526/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=676,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3527/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=677,184,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3528/500000] + train/ActionNoiseL2Loss=0.1046 + throughput/total_tokens=677,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3529/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=677,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3530/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=677,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3531/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=677,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3532/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=678,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3533/500000] + train/ActionNoiseL2Loss=0.1428 + throughput/total_tokens=678,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3534/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=678,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3535/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=678,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3536/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=678,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3537/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=679,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3538/500000] + train/ActionNoiseL2Loss=0.1165 + throughput/total_tokens=679,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3539/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=679,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3540/500000] + optim/total_grad_norm=1.472 + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=679,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3541/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=679,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3542/500000] + train/ActionNoiseL2Loss=0.0279 + throughput/total_tokens=680,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3543/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=680,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3544/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=680,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3545/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=680,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3546/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=680,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3547/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=681,024,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3548/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=681,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3549/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=681,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3550/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=681,600,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3551/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=681,792,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3552/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=681,984,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3553/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=682,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3554/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=682,368,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3555/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=682,560,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3556/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=682,752,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3557/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=682,944,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3558/500000] + train/ActionNoiseL2Loss=0.1146 + throughput/total_tokens=683,136,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3559/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=683,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3560/500000] + optim/total_grad_norm=0.9341 + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=683,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=3561/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=683,712,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3562/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=683,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3563/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=684,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3564/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=684,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3565/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=684,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3566/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=684,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3567/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=684,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3568/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=685,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3569/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=685,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3570/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=685,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3571/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=685,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3572/500000] + train/ActionNoiseL2Loss=0.1096 + throughput/total_tokens=685,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3573/500000] + train/ActionNoiseL2Loss=0.1320 + throughput/total_tokens=686,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3574/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=686,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3575/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=686,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3576/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=686,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3577/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=686,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3578/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=686,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3579/500000] + train/ActionNoiseL2Loss=0.1195 + throughput/total_tokens=687,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3580/500000] + optim/total_grad_norm=1.111 + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=687,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3581/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=687,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3582/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=687,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3583/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=687,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3584/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=688,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3585/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=688,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3586/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=688,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3587/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=688,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3588/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=688,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3589/500000] + train/ActionNoiseL2Loss=0.1733 + throughput/total_tokens=689,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3590/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=689,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3591/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=689,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3592/500000] + train/ActionNoiseL2Loss=0.1340 + throughput/total_tokens=689,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3593/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=689,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3594/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=690,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3595/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=690,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3596/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=690,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3597/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=690,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3598/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=690,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3599/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=691,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3600/500000] + optim/total_grad_norm=0.9945 + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=691,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3601/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=691,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3602/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=691,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3603/500000] + train/ActionNoiseL2Loss=0.1456 + throughput/total_tokens=691,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3604/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=691,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3605/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=692,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3606/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=692,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3607/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=692,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3608/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=692,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3609/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=692,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3610/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=693,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3611/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=693,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3612/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=693,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3613/500000] + train/ActionNoiseL2Loss=0.1100 + throughput/total_tokens=693,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3614/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=693,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3615/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=694,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3616/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=694,272,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3617/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=694,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3618/500000] + train/ActionNoiseL2Loss=0.1573 + throughput/total_tokens=694,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3619/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=694,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3620/500000] + optim/total_grad_norm=0.9518 + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=695,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3621/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=695,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3622/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=695,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3623/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=695,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3624/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=695,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3625/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=696,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3626/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=696,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3627/500000] + train/ActionNoiseL2Loss=0.1533 + throughput/total_tokens=696,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3628/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=696,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3629/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=696,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3630/500000] + train/ActionNoiseL2Loss=0.1577 + throughput/total_tokens=696,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3631/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=697,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3632/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=697,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3633/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=697,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3634/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=697,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3635/500000] + train/ActionNoiseL2Loss=0.1356 + throughput/total_tokens=697,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3636/500000] + train/ActionNoiseL2Loss=0.1221 + throughput/total_tokens=698,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3637/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=698,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3638/500000] + train/ActionNoiseL2Loss=0.1215 + throughput/total_tokens=698,496,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3639/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=698,688,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3640/500000] + optim/total_grad_norm=1.102 + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=698,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3641/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=699,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3642/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=699,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3643/500000] + train/ActionNoiseL2Loss=0.1148 + throughput/total_tokens=699,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3644/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=699,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3645/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=699,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3646/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=700,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3647/500000] + train/ActionNoiseL2Loss=0.2028 + throughput/total_tokens=700,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3648/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=700,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3649/500000] + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=700,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3650/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=700,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3651/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=700,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3652/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=701,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3653/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=701,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3654/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=701,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3655/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=701,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3656/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=701,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3657/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=702,144,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3658/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=702,336,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3659/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=702,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3660/500000] + optim/total_grad_norm=1.154 + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=702,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=3661/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=702,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3662/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=703,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3663/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=703,296,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3664/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=703,488,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3665/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=703,680,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3666/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=703,872,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3667/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=704,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3668/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=704,256,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3669/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=704,448,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3670/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=704,640,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3671/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=704,832,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3672/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=705,024,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3673/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=705,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3674/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=705,408,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3675/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=705,600,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3676/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=705,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3677/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=705,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3678/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=706,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3679/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=706,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3680/500000] + optim/total_grad_norm=1.021 + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=706,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3681/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=706,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3682/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=706,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3683/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=707,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3684/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=707,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3685/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=707,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3686/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=707,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3687/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=707,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3688/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=708,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3689/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=708,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3690/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=708,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3691/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=708,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3692/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=708,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3693/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=709,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3694/500000] + train/ActionNoiseL2Loss=0.1395 + throughput/total_tokens=709,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3695/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=709,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3696/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=709,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3697/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=709,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3698/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=710,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3699/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=710,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3700/500000] + optim/total_grad_norm=0.9666 + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=710,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3701/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=710,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3702/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=710,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3703/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=710,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3704/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=711,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3705/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=711,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3706/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=711,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3707/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=711,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3708/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=711,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3709/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=712,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3710/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=712,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3711/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=712,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3712/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=712,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3713/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=712,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3714/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=713,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3715/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=713,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3716/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=713,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3717/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=713,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3718/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=713,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3719/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=714,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3720/500000] + optim/total_grad_norm=1.770 + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=714,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3721/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=714,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3722/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=714,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3723/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=714,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3724/500000] + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=715,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3725/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=715,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3726/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=715,392,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3727/500000] + train/ActionNoiseL2Loss=0.1071 + throughput/total_tokens=715,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3728/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=715,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3729/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=715,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3730/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=716,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3731/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=716,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3732/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=716,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3733/500000] + train/ActionNoiseL2Loss=0.1307 + throughput/total_tokens=716,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3734/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=716,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3735/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=717,120,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3736/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=717,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3737/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=717,504,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3738/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=717,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3739/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=717,888,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3740/500000] + optim/total_grad_norm=0.9913 + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=718,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3741/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=718,272,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3742/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=718,464,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3743/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=718,656,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3744/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=718,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3745/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=719,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3746/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=719,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3747/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=719,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3748/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=719,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3749/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=719,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3750/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=720,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3751/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=720,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3752/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=720,384,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3753/500000] + train/ActionNoiseL2Loss=0.1335 + throughput/total_tokens=720,576,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3754/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=720,768,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3755/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=720,960,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3756/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=721,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3757/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=721,344,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3758/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=721,536,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3759/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=721,728,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3760/500000] + optim/total_grad_norm=0.8354 + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=721,920,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=3761/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=722,112,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3762/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=722,304,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3763/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=722,496,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3764/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=722,688,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3765/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=722,880,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3766/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=723,072,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3767/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=723,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3768/500000] + train/ActionNoiseL2Loss=0.0945 + throughput/total_tokens=723,456,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3769/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=723,648,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3770/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=723,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3771/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=724,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3772/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=724,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3773/500000] + train/ActionNoiseL2Loss=0.1449 + throughput/total_tokens=724,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3774/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=724,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3775/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=724,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3776/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=724,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3777/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=725,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3778/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=725,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3779/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=725,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3780/500000] + optim/total_grad_norm=0.8398 + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=725,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3781/500000] + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=725,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3782/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=726,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3783/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=726,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3784/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=726,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3785/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=726,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3786/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=726,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3787/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=727,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3788/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=727,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3789/500000] + train/ActionNoiseL2Loss=0.1800 + throughput/total_tokens=727,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3790/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=727,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3791/500000] + train/ActionNoiseL2Loss=0.1155 + throughput/total_tokens=727,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3792/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=728,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3793/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=728,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3794/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=728,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3795/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=728,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3796/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=728,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3797/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=729,024,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3798/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=729,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3799/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=729,408,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3800/500000] + optim/total_grad_norm=1.674 + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=729,600,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3801/500000] + train/ActionNoiseL2Loss=0.1225 + throughput/total_tokens=729,792,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=3802/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=729,984,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=3803/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=730,176,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=3804/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=730,368,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=3805/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=730,560,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=3806/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=730,752,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3807/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=730,944,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3808/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=731,136,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3809/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=731,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3810/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=731,520,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=3811/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=731,712,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=3812/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=731,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3813/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=732,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3814/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=732,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3815/500000] + train/ActionNoiseL2Loss=0.1127 + throughput/total_tokens=732,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3816/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=732,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3817/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=732,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3818/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=733,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3819/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=733,248,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3820/500000] + optim/total_grad_norm=0.9675 + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=733,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3821/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=733,632,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3822/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=733,824,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3823/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=734,016,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3824/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=734,208,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3825/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=734,400,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3826/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=734,592,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3827/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=734,784,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3828/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=734,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3829/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=735,168,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3830/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=735,360,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3831/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=735,552,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3832/500000] + train/ActionNoiseL2Loss=0.1267 + throughput/total_tokens=735,744,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3833/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=735,936,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3834/500000] + train/ActionNoiseL2Loss=0.1141 + throughput/total_tokens=736,128,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3835/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=736,320,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3836/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=736,512,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3837/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=736,704,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3838/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=736,896,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3839/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=737,088,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3840/500000] + optim/total_grad_norm=0.9865 + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=737,280,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3841/500000] + train/ActionNoiseL2Loss=0.1235 + throughput/total_tokens=737,472,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3842/500000] + train/ActionNoiseL2Loss=0.1271 + throughput/total_tokens=737,664,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3843/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=737,856,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3844/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=738,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3845/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=738,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3846/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=738,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3847/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=738,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3848/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=738,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3849/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=739,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3850/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=739,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3851/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=739,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3852/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=739,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3853/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=739,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3854/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=739,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3855/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=740,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3856/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=740,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3857/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=740,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3858/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=740,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3859/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=740,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3860/500000] + optim/total_grad_norm=1.200 + train/ActionNoiseL2Loss=0.1071 + throughput/total_tokens=741,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3861/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=741,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3862/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=741,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3863/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=741,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3864/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=741,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3865/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=742,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3866/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=742,272,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3867/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=742,464,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3868/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=742,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3869/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=742,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3870/500000] + train/ActionNoiseL2Loss=0.1079 + throughput/total_tokens=743,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3871/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=743,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3872/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=743,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3873/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=743,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3874/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=743,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3875/500000] + train/ActionNoiseL2Loss=0.1281 + throughput/total_tokens=744,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3876/500000] + train/ActionNoiseL2Loss=0.1480 + throughput/total_tokens=744,192,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3877/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=744,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3878/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=744,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3879/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=744,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3880/500000] + optim/total_grad_norm=1.257 + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=744,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3881/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=745,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3882/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=745,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3883/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=745,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3884/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=745,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3885/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=745,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3886/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=746,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3887/500000] + train/ActionNoiseL2Loss=0.1198 + throughput/total_tokens=746,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3888/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=746,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3889/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=746,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3890/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=746,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3891/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=747,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3892/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=747,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3893/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=747,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3894/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=747,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3895/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=747,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3896/500000] + train/ActionNoiseL2Loss=0.1226 + throughput/total_tokens=748,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3897/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=748,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3898/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=748,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3899/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=748,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3900/500000] + optim/total_grad_norm=1.035 + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=748,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3901/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=748,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3902/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=749,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3903/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=749,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3904/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=749,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3905/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=749,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3906/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=749,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3907/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=750,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3908/500000] + train/ActionNoiseL2Loss=0.1339 + throughput/total_tokens=750,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3909/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=750,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3910/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=750,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=3911/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=750,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3912/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=751,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3913/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=751,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3914/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=751,488,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3915/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=751,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3916/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=751,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3917/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=752,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3918/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=752,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3919/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=752,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=3920/500000] + optim/total_grad_norm=0.8781 + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=752,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3921/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=752,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3922/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=753,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3923/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=753,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3924/500000] + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=753,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3925/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=753,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3926/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=753,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3927/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=753,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3928/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=754,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3929/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=754,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3930/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=754,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3931/500000] + train/ActionNoiseL2Loss=0.1320 + throughput/total_tokens=754,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3932/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=754,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3933/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=755,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3934/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=755,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3935/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=755,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3936/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=755,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3937/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=755,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3938/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=756,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3939/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=756,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3940/500000] + optim/total_grad_norm=2.023 + train/ActionNoiseL2Loss=0.1309 + throughput/total_tokens=756,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3941/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=756,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3942/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=756,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3943/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=757,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3944/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=757,248,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3945/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=757,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3946/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=757,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3947/500000] + train/ActionNoiseL2Loss=0.1192 + throughput/total_tokens=757,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3948/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=758,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3949/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=758,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=3950/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=758,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3951/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=758,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3952/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=758,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3953/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=758,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3954/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=759,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3955/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=759,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3956/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=759,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=3957/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=759,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=3958/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=759,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3959/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=760,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3960/500000] + optim/total_grad_norm=1.261 + train/ActionNoiseL2Loss=0.1318 + throughput/total_tokens=760,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=3961/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=760,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3962/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=760,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3963/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=760,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3964/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=761,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3965/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=761,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3966/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=761,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3967/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=761,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3968/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=761,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3969/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=762,048,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=3970/500000] + train/ActionNoiseL2Loss=0.1534 + throughput/total_tokens=762,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3971/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=762,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3972/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=762,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3973/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=762,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3974/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=763,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3975/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=763,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3976/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=763,392,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3977/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=763,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3978/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=763,776,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3979/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=763,968,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3980/500000] + optim/total_grad_norm=0.8674 + train/ActionNoiseL2Loss=0.1099 + throughput/total_tokens=764,160,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3981/500000] + train/ActionNoiseL2Loss=0.1070 + throughput/total_tokens=764,352,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3982/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=764,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3983/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=764,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3984/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=764,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3985/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=765,120,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3986/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=765,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3987/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=765,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3988/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=765,696,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=3989/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=765,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3990/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=766,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=3991/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=766,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3992/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=766,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3993/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=766,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3994/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=766,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3995/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=767,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3996/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=767,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=3997/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=767,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3998/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=767,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=3999/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=767,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4000/500000] + optim/total_grad_norm=1.343 + train/ActionNoiseL2Loss=0.1290 + throughput/total_tokens=768,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +10/12 [16:29:25] INFO | >> Saving config... checkpoint.py:608 +10/12 [16:30:06] INFO | >> Saving model state... checkpoint.py:796 +10/12 [16:31:16] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [16:32:47] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=4001/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=768,192,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=4002/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=768,384,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=4003/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=768,576,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=4004/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=768,768,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=4005/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=768,960,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=4006/500000] + train/ActionNoiseL2Loss=0.1177 + throughput/total_tokens=769,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4007/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=769,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4008/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=769,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4009/500000] + train/ActionNoiseL2Loss=0.1252 + throughput/total_tokens=769,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4010/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=769,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4011/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=770,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4012/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=770,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4013/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=770,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4014/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=770,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4015/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=770,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4016/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=771,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4017/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=771,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4018/500000] + train/ActionNoiseL2Loss=0.1182 + throughput/total_tokens=771,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4019/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=771,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4020/500000] + optim/total_grad_norm=1.502 + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=771,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4021/500000] + train/ActionNoiseL2Loss=0.1626 + throughput/total_tokens=772,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4022/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=772,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4023/500000] + train/ActionNoiseL2Loss=0.1184 + throughput/total_tokens=772,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4024/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=772,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4025/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=772,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4026/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=772,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4027/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=773,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4028/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=773,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4029/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=773,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4030/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=773,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4031/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=773,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4032/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=774,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4033/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=774,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4034/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=774,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4035/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=774,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4036/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=774,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4037/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=775,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4038/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=775,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4039/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=775,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4040/500000] + optim/total_grad_norm=1.264 + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=775,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4041/500000] + train/ActionNoiseL2Loss=0.1192 + throughput/total_tokens=775,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4042/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=776,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4043/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=776,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4044/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=776,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4045/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=776,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4046/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=776,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4047/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=777,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4048/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=777,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4049/500000] + train/ActionNoiseL2Loss=0.1255 + throughput/total_tokens=777,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4050/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=777,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4051/500000] + train/ActionNoiseL2Loss=0.1014 + throughput/total_tokens=777,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4052/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=777,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4053/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=778,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4054/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=778,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4055/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=778,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4056/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=778,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4057/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=778,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4058/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=779,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4059/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=779,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4060/500000] + optim/total_grad_norm=1.338 + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=779,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4061/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=779,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4062/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=779,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4063/500000] + train/ActionNoiseL2Loss=0.0972 + throughput/total_tokens=780,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4064/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=780,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4065/500000] + train/ActionNoiseL2Loss=0.1086 + throughput/total_tokens=780,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4066/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=780,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4067/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=780,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4068/500000] + train/ActionNoiseL2Loss=0.1013 + throughput/total_tokens=781,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4069/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=781,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4070/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=781,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4071/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=781,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4072/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=781,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4073/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=782,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4074/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=782,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4075/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=782,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4076/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=782,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4077/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=782,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4078/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=782,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4079/500000] + train/ActionNoiseL2Loss=0.1281 + throughput/total_tokens=783,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4080/500000] + optim/total_grad_norm=0.8416 + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=783,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4081/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=783,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4082/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=783,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4083/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=783,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4084/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=784,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4085/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=784,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4086/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=784,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4087/500000] + train/ActionNoiseL2Loss=0.1124 + throughput/total_tokens=784,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4088/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=784,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4089/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=785,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4090/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=785,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4091/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=785,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4092/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=785,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4093/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=785,856,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4094/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=786,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4095/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=786,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4096/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=786,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4097/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=786,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4098/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=786,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4099/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=787,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4100/500000] + optim/total_grad_norm=1.167 + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=787,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4101/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=787,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4102/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=787,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4103/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=787,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4104/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=787,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4105/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=788,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4106/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=788,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4107/500000] + train/ActionNoiseL2Loss=0.1173 + throughput/total_tokens=788,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4108/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=788,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4109/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=788,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4110/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=789,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4111/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=789,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4112/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=789,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4113/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=789,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4114/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=789,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4115/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=790,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4116/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=790,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4117/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=790,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4118/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=790,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4119/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=790,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4120/500000] + optim/total_grad_norm=1.894 + train/ActionNoiseL2Loss=0.1259 + throughput/total_tokens=791,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4121/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=791,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4122/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=791,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4123/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=791,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4124/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=791,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4125/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=792,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4126/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=792,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4127/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=792,384,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4128/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=792,576,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4129/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=792,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4130/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=792,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4131/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=793,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4132/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=793,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4133/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=793,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4134/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=793,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4135/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=793,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4136/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=794,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4137/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=794,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4138/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=794,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4139/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=794,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4140/500000] + optim/total_grad_norm=1.062 + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=794,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4141/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=795,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4142/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=795,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4143/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=795,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4144/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=795,648,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4145/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=795,840,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4146/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=796,032,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4147/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=796,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4148/500000] + train/ActionNoiseL2Loss=0.1401 + throughput/total_tokens=796,416,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4149/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=796,608,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4150/500000] + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=796,800,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4151/500000] + train/ActionNoiseL2Loss=0.1195 + throughput/total_tokens=796,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4152/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=797,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4153/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=797,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4154/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=797,568,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4155/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=797,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4156/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=797,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4157/500000] + train/ActionNoiseL2Loss=0.1252 + throughput/total_tokens=798,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4158/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=798,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4159/500000] + train/ActionNoiseL2Loss=0.1277 + throughput/total_tokens=798,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4160/500000] + optim/total_grad_norm=1.311 + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=798,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4161/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=798,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4162/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=799,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4163/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=799,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4164/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=799,488,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4165/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=799,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4166/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=799,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4167/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=800,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4168/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=800,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4169/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=800,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4170/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=800,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4171/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=800,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4172/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=801,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4173/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=801,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4174/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=801,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4175/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=801,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4176/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=801,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4177/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=801,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4178/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=802,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4179/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=802,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4180/500000] + optim/total_grad_norm=0.8378 + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=802,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4181/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=802,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4182/500000] + train/ActionNoiseL2Loss=0.1259 + throughput/total_tokens=802,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4183/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=803,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4184/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=803,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4185/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=803,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4186/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=803,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4187/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=803,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4188/500000] + train/ActionNoiseL2Loss=0.1219 + throughput/total_tokens=804,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4189/500000] + train/ActionNoiseL2Loss=0.1316 + throughput/total_tokens=804,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4190/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=804,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4191/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=804,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4192/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=804,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4193/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=805,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4194/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=805,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4195/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=805,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4196/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=805,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4197/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=805,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4198/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=806,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4199/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=806,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4200/500000] + optim/total_grad_norm=1.249 + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=806,400,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4201/500000] + train/ActionNoiseL2Loss=0.1289 + throughput/total_tokens=806,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4202/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=806,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4203/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=806,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4204/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=807,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4205/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=807,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4206/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=807,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4207/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=807,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4208/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=807,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4209/500000] + train/ActionNoiseL2Loss=0.1336 + throughput/total_tokens=808,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4210/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=808,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4211/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=808,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4212/500000] + train/ActionNoiseL2Loss=0.1550 + throughput/total_tokens=808,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4213/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=808,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4214/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=809,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4215/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=809,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4216/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=809,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4217/500000] + train/ActionNoiseL2Loss=0.1428 + throughput/total_tokens=809,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4218/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=809,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4219/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=810,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4220/500000] + optim/total_grad_norm=0.7394 + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=810,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4221/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=810,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4222/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=810,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4223/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=810,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4224/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=811,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4225/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=811,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4226/500000] + train/ActionNoiseL2Loss=0.1356 + throughput/total_tokens=811,392,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4227/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=811,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4228/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=811,776,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4229/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=811,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4230/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=812,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4231/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=812,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4232/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=812,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4233/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=812,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4234/500000] + train/ActionNoiseL2Loss=0.1066 + throughput/total_tokens=812,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4235/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=813,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4236/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=813,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4237/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=813,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4238/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=813,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4239/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=813,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4240/500000] + optim/total_grad_norm=1.371 + train/ActionNoiseL2Loss=0.1053 + throughput/total_tokens=814,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4241/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=814,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4242/500000] + train/ActionNoiseL2Loss=0.0996 + throughput/total_tokens=814,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4243/500000] + train/ActionNoiseL2Loss=0.1647 + throughput/total_tokens=814,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4244/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=814,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4245/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=815,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4246/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=815,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4247/500000] + train/ActionNoiseL2Loss=0.1340 + throughput/total_tokens=815,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4248/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=815,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4249/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=815,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4250/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=816,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4251/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=816,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4252/500000] + train/ActionNoiseL2Loss=0.1394 + throughput/total_tokens=816,384,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4253/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=816,576,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4254/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=816,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4255/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=816,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4256/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=817,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4257/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=817,344,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4258/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=817,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4259/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=817,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4260/500000] + optim/total_grad_norm=1.426 + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=817,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4261/500000] + train/ActionNoiseL2Loss=0.0979 + throughput/total_tokens=818,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4262/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=818,304,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4263/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=818,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4264/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=818,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4265/500000] + train/ActionNoiseL2Loss=0.0982 + throughput/total_tokens=818,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4266/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=819,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4267/500000] + train/ActionNoiseL2Loss=0.1007 + throughput/total_tokens=819,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4268/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=819,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4269/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=819,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4270/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=819,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4271/500000] + train/ActionNoiseL2Loss=0.0996 + throughput/total_tokens=820,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4272/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=820,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4273/500000] + train/ActionNoiseL2Loss=0.1142 + throughput/total_tokens=820,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4274/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=820,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4275/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=820,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4276/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=820,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4277/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=821,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4278/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=821,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4279/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=821,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4280/500000] + optim/total_grad_norm=1.436 + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=821,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4281/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=821,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4282/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=822,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4283/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=822,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4284/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=822,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4285/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=822,720,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4286/500000] + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=822,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4287/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=823,104,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4288/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=823,296,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4289/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=823,488,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4290/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=823,680,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4291/500000] + train/ActionNoiseL2Loss=0.1178 + throughput/total_tokens=823,872,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4292/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=824,064,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4293/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=824,256,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4294/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=824,448,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4295/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=824,640,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4296/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=824,832,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4297/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=825,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4298/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=825,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4299/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=825,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4300/500000] + optim/total_grad_norm=1.425 + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=825,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4301/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=825,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4302/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=825,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4303/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=826,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4304/500000] + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=826,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4305/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=826,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4306/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=826,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4307/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=826,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4308/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=827,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4309/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=827,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4310/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=827,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4311/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=827,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4312/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=827,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4313/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=828,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4314/500000] + train/ActionNoiseL2Loss=0.1243 + throughput/total_tokens=828,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4315/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=828,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4316/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=828,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4317/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=828,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4318/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=829,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4319/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=829,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4320/500000] + optim/total_grad_norm=1.171 + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=829,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4321/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=829,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4322/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=829,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4323/500000] + train/ActionNoiseL2Loss=0.1087 + throughput/total_tokens=830,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4324/500000] + train/ActionNoiseL2Loss=0.1200 + throughput/total_tokens=830,208,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4325/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=830,400,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4326/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=830,592,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4327/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=830,784,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4328/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=830,976,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4329/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=831,168,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4330/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=831,360,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4331/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=831,552,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4332/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=831,744,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4333/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=831,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4334/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=832,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4335/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=832,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4336/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=832,512,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4337/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=832,704,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4338/500000] + train/ActionNoiseL2Loss=0.1158 + throughput/total_tokens=832,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4339/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=833,088,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4340/500000] + optim/total_grad_norm=1.664 + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=833,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4341/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=833,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4342/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=833,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4343/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=833,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4344/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=834,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4345/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=834,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4346/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=834,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4347/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=834,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4348/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=834,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4349/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=835,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4350/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=835,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4351/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=835,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4352/500000] + train/ActionNoiseL2Loss=0.1241 + throughput/total_tokens=835,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4353/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=835,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4354/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=835,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4355/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=836,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4356/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=836,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4357/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=836,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4358/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=836,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4359/500000] + train/ActionNoiseL2Loss=0.1276 + throughput/total_tokens=836,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4360/500000] + optim/total_grad_norm=1.022 + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=837,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4361/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=837,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4362/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=837,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4363/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=837,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4364/500000] + train/ActionNoiseL2Loss=0.1087 + throughput/total_tokens=837,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4365/500000] + train/ActionNoiseL2Loss=0.1524 + throughput/total_tokens=838,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4366/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=838,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4367/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=838,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4368/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=838,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4369/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=838,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4370/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=839,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4371/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=839,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4372/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=839,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4373/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=839,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4374/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=839,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4375/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=840,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4376/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=840,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4377/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=840,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4378/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=840,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4379/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=840,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4380/500000] + optim/total_grad_norm=1.065 + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=840,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4381/500000] + train/ActionNoiseL2Loss=0.1170 + throughput/total_tokens=841,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4382/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=841,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4383/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=841,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4384/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=841,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4385/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=841,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4386/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=842,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4387/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=842,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4388/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=842,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4389/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=842,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4390/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=842,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4391/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=843,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4392/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=843,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4393/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=843,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4394/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=843,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4395/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=843,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4396/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=844,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4397/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=844,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4398/500000] + train/ActionNoiseL2Loss=0.1211 + throughput/total_tokens=844,416,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4399/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=844,608,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=4400/500000] + optim/total_grad_norm=1.424 + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=844,800,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4401/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=844,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4402/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=845,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4403/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=845,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4404/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=845,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4405/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=845,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4406/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=845,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4407/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=846,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4408/500000] + train/ActionNoiseL2Loss=0.1502 + throughput/total_tokens=846,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4409/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=846,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4410/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=846,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4411/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=846,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4412/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=847,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4413/500000] + train/ActionNoiseL2Loss=0.0972 + throughput/total_tokens=847,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4414/500000] + train/ActionNoiseL2Loss=0.1257 + throughput/total_tokens=847,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4415/500000] + train/ActionNoiseL2Loss=0.1265 + throughput/total_tokens=847,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4416/500000] + train/ActionNoiseL2Loss=0.1376 + throughput/total_tokens=847,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4417/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=848,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4418/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=848,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4419/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=848,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4420/500000] + optim/total_grad_norm=1.359 + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=848,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4421/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=848,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4422/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=849,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4423/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=849,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4424/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=849,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4425/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=849,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4426/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=849,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4427/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=849,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4428/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=850,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4429/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=850,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4430/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=850,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4431/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=850,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4432/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=850,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4433/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=851,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4434/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=851,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4435/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=851,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4436/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=851,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4437/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=851,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4438/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=852,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4439/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=852,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4440/500000] + optim/total_grad_norm=1.605 + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=852,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4441/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=852,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4442/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=852,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4443/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=853,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4444/500000] + train/ActionNoiseL2Loss=0.1316 + throughput/total_tokens=853,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4445/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=853,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4446/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=853,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4447/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=853,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4448/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=854,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4449/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=854,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4450/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=854,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4451/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=854,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4452/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=854,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4453/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=854,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4454/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=855,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4455/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=855,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4456/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=855,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4457/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=855,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4458/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=855,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4459/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=856,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4460/500000] + optim/total_grad_norm=1.128 + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=856,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4461/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=856,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4462/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=856,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4463/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=856,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4464/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=857,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4465/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=857,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4466/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=857,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4467/500000] + train/ActionNoiseL2Loss=0.0269 + throughput/total_tokens=857,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4468/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=857,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4469/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=858,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4470/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=858,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4471/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=858,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4472/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=858,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4473/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=858,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4474/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=859,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4475/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=859,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4476/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=859,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4477/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=859,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4478/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=859,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4479/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=859,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4480/500000] + optim/total_grad_norm=1.160 + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=860,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4481/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=860,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4482/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=860,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4483/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=860,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4484/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=860,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4485/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=861,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4486/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=861,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4487/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=861,504,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4488/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=861,696,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4489/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=861,888,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4490/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=862,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4491/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=862,272,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4492/500000] + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=862,464,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4493/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=862,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4494/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=862,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4495/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=863,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4496/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=863,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4497/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=863,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4498/500000] + train/ActionNoiseL2Loss=0.1346 + throughput/total_tokens=863,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4499/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=863,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4500/500000] + optim/total_grad_norm=1.165 + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=864,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/12 [19:28:27] INFO | >> Saving config... checkpoint.py:608 +10/12 [19:29:00] INFO | >> Saving model state... checkpoint.py:796 +10/12 [19:30:10] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [19:31:41] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=4501/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=864,192,000 + throughput/device/tokens_per_second=1,130 + throughput/device/batches_per_second=0.0471 +[step=4502/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=864,384,000 + throughput/device/tokens_per_second=1,130 + throughput/device/batches_per_second=0.0471 +[step=4503/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=864,576,000 + throughput/device/tokens_per_second=1,132 + throughput/device/batches_per_second=0.0472 +[step=4504/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=864,768,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=4505/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=864,960,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=4506/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=865,152,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=4507/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=865,344,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=4508/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=865,536,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=4509/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=865,728,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=4510/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=865,920,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=4511/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=866,112,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4512/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=866,304,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4513/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=866,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4514/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=866,688,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4515/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=866,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4516/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=867,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4517/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=867,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4518/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=867,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4519/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=867,648,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4520/500000] + optim/total_grad_norm=0.8513 + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=867,840,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4521/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=868,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4522/500000] + train/ActionNoiseL2Loss=0.1150 + throughput/total_tokens=868,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4523/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=868,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4524/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=868,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4525/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=868,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4526/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=868,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4527/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=869,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4528/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=869,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4529/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=869,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4530/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=869,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4531/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=869,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4532/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=870,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4533/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=870,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4534/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=870,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4535/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=870,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4536/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=870,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4537/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=871,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4538/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=871,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4539/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=871,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4540/500000] + optim/total_grad_norm=0.8653 + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=871,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4541/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=871,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4542/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=872,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4543/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=872,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4544/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=872,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4545/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=872,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4546/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=872,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4547/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=873,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4548/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=873,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4549/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=873,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4550/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=873,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4551/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=873,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4552/500000] + train/ActionNoiseL2Loss=0.1408 + throughput/total_tokens=873,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4553/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=874,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4554/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=874,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4555/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=874,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4556/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=874,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4557/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=874,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4558/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=875,136,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4559/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=875,328,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4560/500000] + optim/total_grad_norm=1.170 + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=875,520,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4561/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=875,712,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4562/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=875,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4563/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=876,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4564/500000] + train/ActionNoiseL2Loss=0.1653 + throughput/total_tokens=876,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4565/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=876,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4566/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=876,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4567/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=876,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4568/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=877,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4569/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=877,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4570/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=877,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4571/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=877,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4572/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=877,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4573/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=878,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4574/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=878,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4575/500000] + train/ActionNoiseL2Loss=0.1116 + throughput/total_tokens=878,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4576/500000] + train/ActionNoiseL2Loss=0.0271 + throughput/total_tokens=878,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4577/500000] + train/ActionNoiseL2Loss=0.0244 + throughput/total_tokens=878,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4578/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=878,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4579/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=879,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4580/500000] + optim/total_grad_norm=0.6360 + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=879,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4581/500000] + train/ActionNoiseL2Loss=0.0994 + throughput/total_tokens=879,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4582/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=879,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4583/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=879,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4584/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=880,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4585/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=880,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4586/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=880,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4587/500000] + train/ActionNoiseL2Loss=0.1433 + throughput/total_tokens=880,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4588/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=880,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4589/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=881,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4590/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=881,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4591/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=881,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4592/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=881,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4593/500000] + train/ActionNoiseL2Loss=0.1151 + throughput/total_tokens=881,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4594/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=882,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4595/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=882,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4596/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=882,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4597/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=882,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4598/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=882,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4599/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=883,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4600/500000] + optim/total_grad_norm=0.6583 + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=883,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4601/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=883,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4602/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=883,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4603/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=883,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4604/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=883,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4605/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=884,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4606/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=884,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4607/500000] + train/ActionNoiseL2Loss=0.0258 + throughput/total_tokens=884,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4608/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=884,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4609/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=884,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4610/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=885,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4611/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=885,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4612/500000] + train/ActionNoiseL2Loss=0.1155 + throughput/total_tokens=885,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4613/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=885,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4614/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=885,888,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4615/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=886,080,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4616/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=886,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4617/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=886,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4618/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=886,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4619/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=886,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4620/500000] + optim/total_grad_norm=0.8445 + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=887,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4621/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=887,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4622/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=887,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4623/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=887,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4624/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=887,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4625/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=888,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4626/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=888,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4627/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=888,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4628/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=888,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4629/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=888,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4630/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=888,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4631/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=889,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4632/500000] + train/ActionNoiseL2Loss=0.1228 + throughput/total_tokens=889,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4633/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=889,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4634/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=889,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4635/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=889,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4636/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=890,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4637/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=890,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4638/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=890,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4639/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=890,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4640/500000] + optim/total_grad_norm=0.9800 + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=890,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4641/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=891,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4642/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=891,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4643/500000] + train/ActionNoiseL2Loss=0.0252 + throughput/total_tokens=891,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4644/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=891,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4645/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=891,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4646/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=892,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4647/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=892,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4648/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=892,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4649/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=892,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4650/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=892,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4651/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=892,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4652/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=893,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4653/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=893,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4654/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=893,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4655/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=893,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4656/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=893,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4657/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=894,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4658/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=894,336,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4659/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=894,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4660/500000] + optim/total_grad_norm=1.276 + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=894,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=4661/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=894,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4662/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=895,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4663/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=895,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4664/500000] + train/ActionNoiseL2Loss=0.1358 + throughput/total_tokens=895,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4665/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=895,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4666/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=895,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4667/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=896,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4668/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=896,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4669/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=896,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4670/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=896,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4671/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=896,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4672/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=897,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4673/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=897,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4674/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=897,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4675/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=897,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4676/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=897,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4677/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=897,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4678/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=898,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4679/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=898,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4680/500000] + optim/total_grad_norm=0.9517 + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=898,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4681/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=898,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4682/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=898,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4683/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=899,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4684/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=899,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4685/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=899,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4686/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=899,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4687/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=899,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4688/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=900,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4689/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=900,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4690/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=900,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4691/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=900,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4692/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=900,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4693/500000] + train/ActionNoiseL2Loss=0.1118 + throughput/total_tokens=901,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4694/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=901,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4695/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=901,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4696/500000] + train/ActionNoiseL2Loss=0.0820 + throughput/total_tokens=901,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4697/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=901,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4698/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=902,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4699/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=902,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4700/500000] + optim/total_grad_norm=1.086 + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=902,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4701/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=902,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4702/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=902,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4703/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=902,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4704/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=903,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4705/500000] + train/ActionNoiseL2Loss=0.0979 + throughput/total_tokens=903,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4706/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=903,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4707/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=903,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4708/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=903,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4709/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=904,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4710/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=904,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4711/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=904,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4712/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=904,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4713/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=904,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4714/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=905,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4715/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=905,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4716/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=905,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4717/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=905,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4718/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=905,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4719/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=906,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4720/500000] + optim/total_grad_norm=1.318 + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=906,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4721/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=906,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4722/500000] + train/ActionNoiseL2Loss=0.1525 + throughput/total_tokens=906,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4723/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=906,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4724/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=907,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4725/500000] + train/ActionNoiseL2Loss=0.1167 + throughput/total_tokens=907,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4726/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=907,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4727/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=907,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4728/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=907,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4729/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=907,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4730/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=908,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4731/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=908,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4732/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=908,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4733/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=908,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4734/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=908,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4735/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=909,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4736/500000] + train/ActionNoiseL2Loss=0.0298 + throughput/total_tokens=909,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4737/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=909,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4738/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=909,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4739/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=909,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4740/500000] + optim/total_grad_norm=0.9830 + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=910,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4741/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=910,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4742/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=910,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4743/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=910,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4744/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=910,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4745/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=911,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4746/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=911,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4747/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=911,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4748/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=911,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4749/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=911,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4750/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=912,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4751/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=912,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4752/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=912,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4753/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=912,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4754/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=912,768,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4755/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=912,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4756/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=913,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4757/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=913,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4758/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=913,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4759/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=913,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4760/500000] + optim/total_grad_norm=1.281 + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=913,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4761/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=914,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4762/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=914,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4763/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=914,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4764/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=914,688,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4765/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=914,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4766/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=915,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4767/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=915,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4768/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=915,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4769/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=915,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4770/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=915,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4771/500000] + train/ActionNoiseL2Loss=0.1163 + throughput/total_tokens=916,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4772/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=916,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4773/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=916,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4774/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=916,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4775/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=916,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4776/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=916,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4777/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=917,184,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4778/500000] + train/ActionNoiseL2Loss=0.1230 + throughput/total_tokens=917,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4779/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=917,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4780/500000] + optim/total_grad_norm=1.401 + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=917,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4781/500000] + train/ActionNoiseL2Loss=0.1496 + throughput/total_tokens=917,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4782/500000] + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=918,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4783/500000] + train/ActionNoiseL2Loss=0.1195 + throughput/total_tokens=918,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4784/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=918,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4785/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=918,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4786/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=918,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4787/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=919,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4788/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=919,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4789/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=919,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4790/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=919,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4791/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=919,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4792/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=920,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4793/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=920,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4794/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=920,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4795/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=920,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4796/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=920,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4797/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=921,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4798/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=921,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4799/500000] + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=921,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4800/500000] + optim/total_grad_norm=1.620 + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=921,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4801/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=921,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4802/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=921,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4803/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=922,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4804/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=922,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4805/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=922,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4806/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=922,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4807/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=922,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4808/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=923,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4809/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=923,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4810/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=923,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4811/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=923,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4812/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=923,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4813/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=924,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4814/500000] + train/ActionNoiseL2Loss=0.1296 + throughput/total_tokens=924,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4815/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=924,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4816/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=924,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4817/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=924,864,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4818/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=925,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4819/500000] + train/ActionNoiseL2Loss=0.1146 + throughput/total_tokens=925,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4820/500000] + optim/total_grad_norm=1.194 + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=925,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4821/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=925,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4822/500000] + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=925,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4823/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=926,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4824/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=926,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4825/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=926,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4826/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=926,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4827/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=926,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4828/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=926,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4829/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=927,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4830/500000] + train/ActionNoiseL2Loss=0.1521 + throughput/total_tokens=927,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4831/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=927,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4832/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=927,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4833/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=927,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4834/500000] + train/ActionNoiseL2Loss=0.1064 + throughput/total_tokens=928,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4835/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=928,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4836/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=928,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4837/500000] + train/ActionNoiseL2Loss=0.1079 + throughput/total_tokens=928,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4838/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=928,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4839/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=929,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4840/500000] + optim/total_grad_norm=0.8978 + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=929,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4841/500000] + train/ActionNoiseL2Loss=0.0968 + throughput/total_tokens=929,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4842/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=929,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4843/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=929,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4844/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=930,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4845/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=930,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4846/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=930,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4847/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=930,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4848/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=930,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4849/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=931,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4850/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=931,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4851/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=931,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4852/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=931,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4853/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=931,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4854/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=931,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4855/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=932,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4856/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=932,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4857/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=932,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4858/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=932,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4859/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=932,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4860/500000] + optim/total_grad_norm=2.294 + train/ActionNoiseL2Loss=0.1833 + throughput/total_tokens=933,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4861/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=933,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4862/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=933,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4863/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=933,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4864/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=933,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4865/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=934,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4866/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=934,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4867/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=934,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4868/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=934,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4869/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=934,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4870/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=935,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4871/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=935,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4872/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=935,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4873/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=935,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4874/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=935,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4875/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=936,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4876/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=936,192,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4877/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=936,384,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4878/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=936,576,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4879/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=936,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4880/500000] + optim/total_grad_norm=0.8500 + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=936,960,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4881/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=937,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4882/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=937,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4883/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=937,536,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4884/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=937,728,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4885/500000] + train/ActionNoiseL2Loss=0.1103 + throughput/total_tokens=937,920,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4886/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=938,112,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4887/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=938,304,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4888/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=938,496,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4889/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=938,688,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4890/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=938,880,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=4891/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=939,072,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=4892/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=939,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4893/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=939,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4894/500000] + train/ActionNoiseL2Loss=0.1388 + throughput/total_tokens=939,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4895/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=939,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4896/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=940,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4897/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=940,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4898/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=940,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4899/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=940,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4900/500000] + optim/total_grad_norm=1.280 + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=940,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4901/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=940,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4902/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=941,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4903/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=941,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4904/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=941,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4905/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=941,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4906/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=941,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4907/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=942,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4908/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=942,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4909/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=942,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4910/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=942,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4911/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=942,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4912/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=943,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4913/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=943,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4914/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=943,488,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4915/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=943,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4916/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=943,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=4917/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=944,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4918/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=944,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4919/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=944,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4920/500000] + optim/total_grad_norm=1.077 + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=944,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4921/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=944,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4922/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=945,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4923/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=945,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4924/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=945,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4925/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=945,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4926/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=945,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4927/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=945,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4928/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=946,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4929/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=946,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4930/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=946,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4931/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=946,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4932/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=946,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4933/500000] + train/ActionNoiseL2Loss=0.1200 + throughput/total_tokens=947,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4934/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=947,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4935/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=947,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4936/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=947,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4937/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=947,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4938/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=948,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4939/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=948,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4940/500000] + optim/total_grad_norm=0.8499 + train/ActionNoiseL2Loss=0.0942 + throughput/total_tokens=948,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4941/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=948,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4942/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=948,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4943/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=949,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4944/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=949,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4945/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=949,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4946/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=949,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=4947/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=949,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4948/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=950,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4949/500000] + train/ActionNoiseL2Loss=0.1374 + throughput/total_tokens=950,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4950/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=950,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4951/500000] + train/ActionNoiseL2Loss=0.0236 + throughput/total_tokens=950,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4952/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=950,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4953/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=950,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4954/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=951,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4955/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=951,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4956/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=951,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4957/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=951,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4958/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=951,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4959/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=952,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4960/500000] + optim/total_grad_norm=1.259 + train/ActionNoiseL2Loss=0.1229 + throughput/total_tokens=952,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=4961/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=952,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4962/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=952,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4963/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=952,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4964/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=953,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4965/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=953,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4966/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=953,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4967/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=953,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4968/500000] + train/ActionNoiseL2Loss=0.1085 + throughput/total_tokens=953,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4969/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=954,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=4970/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=954,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4971/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=954,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4972/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=954,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4973/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=954,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4974/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=955,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4975/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=955,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4976/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=955,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4977/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=955,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4978/500000] + train/ActionNoiseL2Loss=0.0261 + throughput/total_tokens=955,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4979/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=955,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4980/500000] + optim/total_grad_norm=2.074 + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=956,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4981/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=956,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4982/500000] + train/ActionNoiseL2Loss=0.0893 + throughput/total_tokens=956,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4983/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=956,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4984/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=956,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4985/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=957,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4986/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=957,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4987/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=957,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4988/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=957,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4989/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=957,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4990/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=958,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=4991/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=958,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4992/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=958,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4993/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=958,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4994/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=958,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4995/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=959,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4996/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=959,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4997/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=959,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=4998/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=959,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=4999/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=959,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5000/500000] + optim/total_grad_norm=1.806 + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=960,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/12 [22:27:26] INFO | >> Saving config... checkpoint.py:608 +10/12 [22:28:14] INFO | >> Saving model state... checkpoint.py:796 +10/12 [22:29:26] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [22:30:56] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=5001/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=960,192,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=5002/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=960,384,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=5003/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=960,576,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=5004/500000] + train/ActionNoiseL2Loss=0.1042 + throughput/total_tokens=960,768,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=5005/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=960,960,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5006/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=961,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5007/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=961,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5008/500000] + train/ActionNoiseL2Loss=0.1532 + throughput/total_tokens=961,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5009/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=961,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5010/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=961,920,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5011/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=962,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5012/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=962,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5013/500000] + train/ActionNoiseL2Loss=0.1403 + throughput/total_tokens=962,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5014/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=962,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5015/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=962,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5016/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=963,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5017/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=963,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5018/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=963,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5019/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=963,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5020/500000] + optim/total_grad_norm=1.002 + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=963,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5021/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=964,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5022/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=964,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5023/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=964,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5024/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=964,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5025/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=964,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5026/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=964,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5027/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=965,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5028/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=965,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5029/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=965,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5030/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=965,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5031/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=965,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5032/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=966,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5033/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=966,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5034/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=966,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5035/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=966,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5036/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=966,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5037/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=967,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5038/500000] + train/ActionNoiseL2Loss=0.1103 + throughput/total_tokens=967,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5039/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=967,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5040/500000] + optim/total_grad_norm=1.117 + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=967,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5041/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=967,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5042/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=968,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5043/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=968,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5044/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=968,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5045/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=968,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5046/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=968,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5047/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=969,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5048/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=969,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5049/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=969,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5050/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=969,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5051/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=969,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5052/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=969,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5053/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=970,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5054/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=970,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5055/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=970,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5056/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=970,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5057/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=970,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5058/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=971,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5059/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=971,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5060/500000] + optim/total_grad_norm=1.222 + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=971,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5061/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=971,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5062/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=971,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5063/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=972,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5064/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=972,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5065/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=972,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5066/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=972,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5067/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=972,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5068/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=973,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5069/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=973,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5070/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=973,440,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5071/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=973,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5072/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=973,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5073/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=974,016,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5074/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=974,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5075/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=974,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5076/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=974,592,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5077/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=974,784,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5078/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=974,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5079/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=975,168,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5080/500000] + optim/total_grad_norm=0.8469 + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=975,360,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5081/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=975,552,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5082/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=975,744,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5083/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=975,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5084/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=976,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5085/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=976,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5086/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=976,512,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5087/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=976,704,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5088/500000] + train/ActionNoiseL2Loss=0.1009 + throughput/total_tokens=976,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5089/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=977,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5090/500000] + train/ActionNoiseL2Loss=0.1131 + throughput/total_tokens=977,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5091/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=977,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5092/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=977,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5093/500000] + train/ActionNoiseL2Loss=0.1421 + throughput/total_tokens=977,856,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5094/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=978,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5095/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=978,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5096/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=978,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5097/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=978,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5098/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=978,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5099/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=979,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5100/500000] + optim/total_grad_norm=1.530 + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=979,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5101/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=979,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5102/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=979,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5103/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=979,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5104/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=979,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5105/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=980,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5106/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=980,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5107/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=980,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5108/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=980,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5109/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=980,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5110/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=981,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5111/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=981,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5112/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=981,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5113/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=981,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5114/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=981,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5115/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=982,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5116/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=982,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5117/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=982,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5118/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=982,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5119/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=982,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5120/500000] + optim/total_grad_norm=0.6695 + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=983,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5121/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=983,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5122/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=983,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5123/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=983,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5124/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=983,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5125/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=984,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5126/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=984,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5127/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=984,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5128/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=984,576,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5129/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=984,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5130/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=984,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5131/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=985,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5132/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=985,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5133/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=985,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5134/500000] + train/ActionNoiseL2Loss=0.1125 + throughput/total_tokens=985,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5135/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=985,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5136/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=986,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5137/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=986,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5138/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=986,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5139/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=986,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5140/500000] + optim/total_grad_norm=1.112 + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=986,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5141/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=987,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5142/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=987,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5143/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=987,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5144/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=987,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5145/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=987,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5146/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=988,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5147/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=988,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5148/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=988,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5149/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=988,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5150/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=988,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5151/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=988,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5152/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=989,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5153/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=989,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5154/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=989,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5155/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=989,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5156/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=989,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5157/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=990,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5158/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=990,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5159/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=990,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5160/500000] + optim/total_grad_norm=0.8986 + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=990,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5161/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=990,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5162/500000] + train/ActionNoiseL2Loss=0.0878 + throughput/total_tokens=991,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5163/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=991,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5164/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=991,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5165/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=991,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5166/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=991,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5167/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=992,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5168/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=992,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5169/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=992,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5170/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=992,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5171/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=992,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5172/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=993,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5173/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=993,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5174/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=993,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5175/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=993,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5176/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=993,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5177/500000] + train/ActionNoiseL2Loss=0.1085 + throughput/total_tokens=993,984,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5178/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=994,176,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5179/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=994,368,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5180/500000] + optim/total_grad_norm=0.9015 + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=994,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5181/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=994,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5182/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=994,944,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5183/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=995,136,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5184/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=995,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5185/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=995,520,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5186/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=995,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5187/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=995,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5188/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=996,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5189/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=996,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5190/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=996,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5191/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=996,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5192/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=996,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5193/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=997,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5194/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=997,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5195/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=997,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5196/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=997,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5197/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=997,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5198/500000] + train/ActionNoiseL2Loss=0.1070 + throughput/total_tokens=998,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5199/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=998,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5200/500000] + optim/total_grad_norm=0.9912 + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=998,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5201/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=998,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5202/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=998,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5203/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=998,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5204/500000] + train/ActionNoiseL2Loss=0.1443 + throughput/total_tokens=999,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5205/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=999,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5206/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=999,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5207/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=999,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5208/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=999,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5209/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=1,000,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5210/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,000,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5211/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,000,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5212/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,000,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5213/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=1,000,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5214/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,001,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5215/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,001,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5216/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,001,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5217/500000] + train/ActionNoiseL2Loss=0.1436 + throughput/total_tokens=1,001,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5218/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,001,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5219/500000] + train/ActionNoiseL2Loss=0.1390 + throughput/total_tokens=1,002,048,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5220/500000] + optim/total_grad_norm=0.9795 + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,002,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5221/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,002,432,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5222/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,002,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5223/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,002,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5224/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=1,003,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5225/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,003,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5226/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=1,003,392,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5227/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,003,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5228/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=1,003,776,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5229/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,003,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5230/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,004,160,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5231/500000] + train/ActionNoiseL2Loss=0.1008 + throughput/total_tokens=1,004,352,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5232/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,004,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5233/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,004,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5234/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,004,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5235/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=1,005,120,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5236/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,005,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5237/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,005,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5238/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=1,005,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5239/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,005,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5240/500000] + optim/total_grad_norm=1.074 + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=1,006,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5241/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=1,006,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5242/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,006,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5243/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=1,006,656,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5244/500000] + train/ActionNoiseL2Loss=0.1044 + throughput/total_tokens=1,006,848,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5245/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,007,040,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5246/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,007,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5247/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,007,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5248/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,007,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5249/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,007,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5250/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,008,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5251/500000] + train/ActionNoiseL2Loss=0.1246 + throughput/total_tokens=1,008,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5252/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,008,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5253/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,008,576,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5254/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,008,768,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5255/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=1,008,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5256/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=1,009,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5257/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=1,009,344,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5258/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,009,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5259/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=1,009,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5260/500000] + optim/total_grad_norm=1.234 + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,009,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5261/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,010,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5262/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=1,010,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5263/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,010,496,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5264/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,010,688,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5265/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,010,880,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5266/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,011,072,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5267/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,011,264,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5268/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,011,456,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5269/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,011,648,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5270/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,011,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5271/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,012,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5272/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,012,224,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5273/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,012,416,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5274/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,012,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5275/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,012,800,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5276/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,012,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5277/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=1,013,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5278/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=1,013,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5279/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,013,568,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5280/500000] + optim/total_grad_norm=1.362 + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,013,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5281/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,013,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5282/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,014,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5283/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,014,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5284/500000] + train/ActionNoiseL2Loss=0.1137 + throughput/total_tokens=1,014,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5285/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=1,014,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5286/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=1,014,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5287/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,015,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5288/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,015,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5289/500000] + train/ActionNoiseL2Loss=0.1076 + throughput/total_tokens=1,015,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5290/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,015,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5291/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,015,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5292/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,016,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5293/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,016,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5294/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=1,016,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5295/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,016,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5296/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,016,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5297/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,017,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5298/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,017,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5299/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,017,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5300/500000] + optim/total_grad_norm=0.8331 + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,017,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5301/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,017,792,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=5302/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=1,017,984,000 + throughput/device/tokens_per_second=1,132 + throughput/device/batches_per_second=0.0472 +[step=5303/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,018,176,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5304/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,018,368,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0470 +[step=5305/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,018,560,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0470 +[step=5306/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,018,752,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5307/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=1,018,944,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5308/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=1,019,136,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5309/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,019,328,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5310/500000] + train/ActionNoiseL2Loss=0.1834 + throughput/total_tokens=1,019,520,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 + System/Peak GPU Memory (MB)=51,076 +[step=5311/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,019,712,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5312/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=1,019,904,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5313/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,020,096,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5314/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,020,288,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5315/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,020,480,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5316/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,020,672,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5317/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=1,020,864,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5318/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,021,056,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0471 +[step=5319/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,021,248,000 + throughput/device/tokens_per_second=1,129 + throughput/device/batches_per_second=0.0470 +[step=5320/500000] + optim/total_grad_norm=0.9625 + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,021,440,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5321/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,021,632,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5322/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,021,824,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5323/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=1,022,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5324/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,022,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5325/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,022,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5326/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,022,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5327/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,022,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5328/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,022,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5329/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,023,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5330/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,023,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5331/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=1,023,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5332/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,023,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5333/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,023,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5334/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,024,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5335/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,024,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5336/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,024,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5337/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,024,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5338/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,024,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5339/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,025,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5340/500000] + optim/total_grad_norm=0.9252 + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,025,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5341/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,025,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5342/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=1,025,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5343/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,025,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5344/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,026,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5345/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,026,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5346/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=1,026,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5347/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,026,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5348/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,026,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5349/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,027,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5350/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,027,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5351/500000] + train/ActionNoiseL2Loss=0.1381 + throughput/total_tokens=1,027,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5352/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,027,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5353/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,027,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5354/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=1,027,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5355/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,028,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5356/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,028,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5357/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,028,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5358/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,028,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5359/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,028,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5360/500000] + optim/total_grad_norm=1.195 + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,029,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=5361/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,029,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5362/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,029,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5363/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,029,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5364/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=1,029,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5365/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,030,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5366/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,030,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5367/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,030,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5368/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,030,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5369/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,030,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5370/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,031,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5371/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,031,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5372/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,031,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5373/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,031,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5374/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=1,031,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5375/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=1,032,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5376/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,032,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5377/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=1,032,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5378/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,032,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5379/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,032,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5380/500000] + optim/total_grad_norm=1.335 + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=1,032,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5381/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,033,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5382/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,033,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5383/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,033,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5384/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=1,033,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5385/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,033,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5386/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=1,034,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5387/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,034,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5388/500000] + train/ActionNoiseL2Loss=0.1478 + throughput/total_tokens=1,034,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5389/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,034,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5390/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,034,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5391/500000] + train/ActionNoiseL2Loss=0.1174 + throughput/total_tokens=1,035,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5392/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,035,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5393/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,035,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5394/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,035,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5395/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,035,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5396/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=1,036,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5397/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,036,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5398/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,036,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5399/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,036,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5400/500000] + optim/total_grad_norm=1.013 + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,036,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5401/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,036,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5402/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,037,184,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5403/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,037,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5404/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,037,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5405/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,037,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5406/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,037,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5407/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=1,038,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5408/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,038,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5409/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,038,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5410/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=1,038,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5411/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,038,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5412/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,039,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5413/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,039,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5414/500000] + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=1,039,488,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5415/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,039,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5416/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=1,039,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5417/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,040,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5418/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,040,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5419/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,040,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5420/500000] + optim/total_grad_norm=0.7272 + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,040,640,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5421/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=1,040,832,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5422/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,041,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5423/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,041,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5424/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=1,041,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5425/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,041,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5426/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,041,792,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5427/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,041,984,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5428/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,042,176,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5429/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,042,368,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5430/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,042,560,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5431/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,042,752,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5432/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,042,944,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5433/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,043,136,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5434/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,043,328,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5435/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,043,520,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5436/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=1,043,712,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5437/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,043,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5438/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,044,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5439/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,044,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5440/500000] + optim/total_grad_norm=1.177 + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,044,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5441/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,044,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5442/500000] + train/ActionNoiseL2Loss=0.1169 + throughput/total_tokens=1,044,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5443/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,045,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5444/500000] + train/ActionNoiseL2Loss=0.1411 + throughput/total_tokens=1,045,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5445/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,045,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5446/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,045,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5447/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=1,045,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5448/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,046,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5449/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,046,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5450/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,046,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5451/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,046,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5452/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,046,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5453/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,046,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5454/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,047,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5455/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,047,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5456/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=1,047,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5457/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,047,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5458/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,047,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5459/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,048,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5460/500000] + optim/total_grad_norm=0.6813 + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,048,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5461/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,048,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5462/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=1,048,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5463/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,048,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5464/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=1,049,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5465/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,049,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5466/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,049,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5467/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,049,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5468/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,049,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5469/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,050,048,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5470/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,050,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5471/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,050,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5472/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,050,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5473/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,050,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5474/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,051,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5475/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,051,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5476/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,051,392,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5477/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,051,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5478/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,051,776,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5479/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=1,051,968,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5480/500000] + optim/total_grad_norm=0.7228 + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=1,052,160,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5481/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,052,352,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5482/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,052,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5483/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,052,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5484/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=1,052,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5485/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,053,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5486/500000] + train/ActionNoiseL2Loss=0.1296 + throughput/total_tokens=1,053,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5487/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,053,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5488/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,053,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5489/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,053,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5490/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,054,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5491/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=1,054,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5492/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,054,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5493/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=1,054,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5494/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,054,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5495/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,055,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5496/500000] + train/ActionNoiseL2Loss=0.1164 + throughput/total_tokens=1,055,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5497/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,055,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5498/500000] + train/ActionNoiseL2Loss=0.1071 + throughput/total_tokens=1,055,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5499/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,055,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5500/500000] + optim/total_grad_norm=1.133 + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,056,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/13 [01:26:50] INFO | >> Saving config... checkpoint.py:608 +10/13 [01:27:22] INFO | >> Saving model state... checkpoint.py:796 +10/13 [01:28:35] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [01:30:05] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=5501/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=1,056,192,000 + throughput/device/tokens_per_second=1,132 + throughput/device/batches_per_second=0.0472 +[step=5502/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=1,056,384,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=5503/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,056,576,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=5504/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,056,768,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=5505/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,056,960,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5506/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,057,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5507/500000] + train/ActionNoiseL2Loss=0.1239 + throughput/total_tokens=1,057,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5508/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,057,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5509/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,057,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5510/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,057,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5511/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,058,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5512/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,058,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5513/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,058,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5514/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,058,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5515/500000] + train/ActionNoiseL2Loss=0.1245 + throughput/total_tokens=1,058,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5516/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,059,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5517/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,059,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5518/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=1,059,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5519/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=1,059,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5520/500000] + optim/total_grad_norm=0.9626 + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,059,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5521/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,060,032,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5522/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,060,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5523/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,060,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5524/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,060,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5525/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,060,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5526/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=1,060,992,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5527/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,061,184,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5528/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,061,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5529/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,061,568,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5530/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,061,760,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5531/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,061,952,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5532/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,062,144,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5533/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,062,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5534/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,062,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5535/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,062,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5536/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,062,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5537/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,063,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5538/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,063,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5539/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,063,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5540/500000] + optim/total_grad_norm=0.9892 + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,063,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5541/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,063,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5542/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=1,064,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5543/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,064,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5544/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,064,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5545/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=1,064,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5546/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,064,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5547/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=1,065,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5548/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,065,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5549/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,065,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5550/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,065,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5551/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,065,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5552/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,065,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5553/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,066,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5554/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,066,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5555/500000] + train/ActionNoiseL2Loss=0.1338 + throughput/total_tokens=1,066,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5556/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,066,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5557/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,066,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5558/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,067,136,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5559/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,067,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5560/500000] + optim/total_grad_norm=1.259 + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=1,067,520,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5561/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,067,712,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5562/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,067,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5563/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,068,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5564/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,068,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5565/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,068,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5566/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,068,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5567/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=1,068,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5568/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,069,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5569/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=1,069,248,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5570/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,069,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5571/500000] + train/ActionNoiseL2Loss=0.1158 + throughput/total_tokens=1,069,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5572/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,069,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5573/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,070,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5574/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,070,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5575/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=1,070,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5576/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,070,592,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5577/500000] + train/ActionNoiseL2Loss=0.1196 + throughput/total_tokens=1,070,784,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5578/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=1,070,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5579/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=1,071,168,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5580/500000] + optim/total_grad_norm=0.9125 + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,071,360,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5581/500000] + train/ActionNoiseL2Loss=0.1123 + throughput/total_tokens=1,071,552,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5582/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,071,744,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5583/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,071,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5584/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,072,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5585/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,072,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5586/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,072,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5587/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,072,704,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5588/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,072,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5589/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=1,073,088,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5590/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=1,073,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5591/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,073,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5592/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=1,073,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5593/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=1,073,856,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5594/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=1,074,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5595/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=1,074,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5596/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,074,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5597/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,074,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5598/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,074,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5599/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,075,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5600/500000] + optim/total_grad_norm=1.439 + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=1,075,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5601/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,075,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5602/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=1,075,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5603/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,075,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5604/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=1,075,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5605/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,076,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5606/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=1,076,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5607/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,076,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5608/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,076,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5609/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,076,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5610/500000] + train/ActionNoiseL2Loss=0.1658 + throughput/total_tokens=1,077,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5611/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,077,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5612/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,077,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5613/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,077,696,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5614/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,077,888,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5615/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,078,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5616/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=1,078,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5617/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,078,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5618/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,078,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5619/500000] + train/ActionNoiseL2Loss=0.1118 + throughput/total_tokens=1,078,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5620/500000] + optim/total_grad_norm=1.060 + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=1,079,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5621/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,079,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5622/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,079,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5623/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,079,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5624/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,079,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5625/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,080,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5626/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,080,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5627/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,080,384,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5628/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,080,576,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5629/500000] + train/ActionNoiseL2Loss=0.0917 + throughput/total_tokens=1,080,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5630/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,080,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5631/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,081,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5632/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,081,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5633/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,081,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5634/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,081,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5635/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,081,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5636/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,082,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5637/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,082,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5638/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,082,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5639/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,082,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5640/500000] + optim/total_grad_norm=1.124 + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,082,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5641/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,083,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5642/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,083,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5643/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,083,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5644/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,083,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5645/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,083,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5646/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,084,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5647/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,084,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5648/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,084,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5649/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,084,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5650/500000] + train/ActionNoiseL2Loss=0.1127 + throughput/total_tokens=1,084,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5651/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=1,084,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5652/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,085,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5653/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,085,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5654/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,085,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5655/500000] + train/ActionNoiseL2Loss=0.1429 + throughput/total_tokens=1,085,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5656/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,085,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5657/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,086,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5658/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=1,086,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5659/500000] + train/ActionNoiseL2Loss=0.0270 + throughput/total_tokens=1,086,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5660/500000] + optim/total_grad_norm=2.036 + train/ActionNoiseL2Loss=0.1189 + throughput/total_tokens=1,086,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5661/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,086,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5662/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=1,087,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5663/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,087,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5664/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,087,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5665/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,087,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5666/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,087,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5667/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,088,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5668/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,088,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5669/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,088,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5670/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,088,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5671/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,088,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5672/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,089,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5673/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,089,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5674/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,089,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5675/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,089,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5676/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,089,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5677/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=1,089,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5678/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,090,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5679/500000] + train/ActionNoiseL2Loss=0.1216 + throughput/total_tokens=1,090,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5680/500000] + optim/total_grad_norm=1.107 + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,090,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5681/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,090,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5682/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,090,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5683/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=1,091,136,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5684/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,091,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5685/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=1,091,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5686/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,091,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5687/500000] + train/ActionNoiseL2Loss=0.0917 + throughput/total_tokens=1,091,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5688/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=1,092,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5689/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,092,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5690/500000] + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=1,092,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5691/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,092,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5692/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,092,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5693/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=1,093,056,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5694/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,093,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5695/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=1,093,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5696/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,093,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5697/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=1,093,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5698/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,094,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5699/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,094,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5700/500000] + optim/total_grad_norm=1.157 + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,094,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5701/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,094,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5702/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,094,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5703/500000] + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=1,094,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5704/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,095,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5705/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,095,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5706/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=1,095,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5707/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,095,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5708/500000] + train/ActionNoiseL2Loss=0.0224 + throughput/total_tokens=1,095,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5709/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,096,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5710/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,096,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5711/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,096,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5712/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,096,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5713/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,096,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5714/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=1,097,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5715/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,097,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5716/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,097,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5717/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=1,097,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5718/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,097,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5719/500000] + train/ActionNoiseL2Loss=0.0243 + throughput/total_tokens=1,098,048,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5720/500000] + optim/total_grad_norm=1.040 + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,098,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5721/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,098,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5722/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,098,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5723/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,098,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5724/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,099,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5725/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,099,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5726/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,099,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5727/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,099,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5728/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,099,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5729/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,099,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5730/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,100,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5731/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=1,100,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5732/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,100,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5733/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=1,100,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5734/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=1,100,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5735/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,101,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5736/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,101,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5737/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,101,504,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5738/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,101,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5739/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,101,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5740/500000] + optim/total_grad_norm=0.7273 + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,102,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5741/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=1,102,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5742/500000] + train/ActionNoiseL2Loss=0.1098 + throughput/total_tokens=1,102,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5743/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,102,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5744/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,102,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5745/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=1,103,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5746/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,103,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5747/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,103,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5748/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,103,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5749/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,103,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5750/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,104,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5751/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,104,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5752/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,104,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5753/500000] + train/ActionNoiseL2Loss=0.1155 + throughput/total_tokens=1,104,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5754/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,104,768,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5755/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=1,104,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5756/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,105,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5757/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,105,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5758/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,105,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5759/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,105,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5760/500000] + optim/total_grad_norm=0.7225 + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,105,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5761/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,106,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5762/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,106,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5763/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,106,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5764/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=1,106,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5765/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,106,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5766/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,107,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5767/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,107,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5768/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,107,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5769/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,107,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5770/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,107,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5771/500000] + train/ActionNoiseL2Loss=0.0917 + throughput/total_tokens=1,108,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5772/500000] + train/ActionNoiseL2Loss=0.1007 + throughput/total_tokens=1,108,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5773/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,108,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5774/500000] + train/ActionNoiseL2Loss=0.1244 + throughput/total_tokens=1,108,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5775/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,108,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5776/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,108,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5777/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,109,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5778/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,109,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5779/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,109,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5780/500000] + optim/total_grad_norm=1.267 + train/ActionNoiseL2Loss=0.1227 + throughput/total_tokens=1,109,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5781/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,109,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5782/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,110,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5783/500000] + train/ActionNoiseL2Loss=0.0888 + throughput/total_tokens=1,110,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5784/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=1,110,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5785/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,110,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5786/500000] + train/ActionNoiseL2Loss=0.0292 + throughput/total_tokens=1,110,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5787/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=1,111,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5788/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,111,296,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5789/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=1,111,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5790/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,111,680,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5791/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=1,111,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5792/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=1,112,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5793/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,112,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5794/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,112,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5795/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=1,112,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5796/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,112,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5797/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,113,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5798/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,113,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5799/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,113,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5800/500000] + optim/total_grad_norm=0.7754 + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,113,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5801/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,113,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5802/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,113,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5803/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,114,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5804/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,114,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5805/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,114,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5806/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,114,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5807/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=1,114,944,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5808/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,115,136,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5809/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,115,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5810/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,115,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=5811/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,115,712,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5812/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,115,904,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5813/500000] + train/ActionNoiseL2Loss=0.1031 + throughput/total_tokens=1,116,096,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5814/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,116,288,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5815/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,116,480,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5816/500000] + train/ActionNoiseL2Loss=0.0222 + throughput/total_tokens=1,116,672,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5817/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,116,864,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5818/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,117,056,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5819/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,117,248,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5820/500000] + optim/total_grad_norm=1.027 + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,117,440,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5821/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,117,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5822/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=1,117,824,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5823/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,118,016,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5824/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,118,208,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5825/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,118,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5826/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,118,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5827/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=1,118,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5828/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,118,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5829/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,119,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5830/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,119,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5831/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=1,119,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5832/500000] + train/ActionNoiseL2Loss=0.1361 + throughput/total_tokens=1,119,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5833/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,119,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5834/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,120,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5835/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,120,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5836/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,120,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5837/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,120,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5838/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,120,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5839/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,121,088,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5840/500000] + optim/total_grad_norm=0.7364 + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=1,121,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5841/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,121,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5842/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,121,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5843/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,121,856,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5844/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,122,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5845/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,122,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5846/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,122,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5847/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,122,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5848/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,122,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5849/500000] + train/ActionNoiseL2Loss=0.1113 + throughput/total_tokens=1,123,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5850/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,123,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5851/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,123,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5852/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,123,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5853/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=1,123,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5854/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,123,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5855/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,124,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5856/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,124,352,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5857/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=1,124,544,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5858/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,124,736,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5859/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=1,124,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5860/500000] + optim/total_grad_norm=0.9609 + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,125,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=5861/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,125,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5862/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,125,504,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5863/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=1,125,696,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5864/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,125,888,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=5865/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,126,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5866/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=1,126,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5867/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,126,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5868/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,126,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5869/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=1,126,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=5870/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,127,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5871/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,127,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5872/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,127,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5873/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,127,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5874/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,127,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5875/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,128,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5876/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,128,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5877/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,128,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5878/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,128,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5879/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,128,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5880/500000] + optim/total_grad_norm=1.047 + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=1,128,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5881/500000] + train/ActionNoiseL2Loss=0.1231 + throughput/total_tokens=1,129,152,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5882/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,129,344,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5883/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=1,129,536,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5884/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,129,728,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5885/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,129,920,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5886/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,130,112,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5887/500000] + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=1,130,304,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5888/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,130,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5889/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,130,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5890/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,130,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5891/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,131,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5892/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,131,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5893/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,131,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5894/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,131,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5895/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,131,840,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5896/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,132,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5897/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,132,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=5898/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,132,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5899/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,132,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5900/500000] + optim/total_grad_norm=1.186 + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,132,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5901/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,132,992,000 + throughput/device/tokens_per_second=1,127 + throughput/device/batches_per_second=0.0470 +[step=5902/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,133,184,000 + throughput/device/tokens_per_second=1,127 + throughput/device/batches_per_second=0.0470 +[step=5903/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=1,133,376,000 + throughput/device/tokens_per_second=1,127 + throughput/device/batches_per_second=0.0470 +[step=5904/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=1,133,568,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5905/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,133,760,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5906/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,133,952,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5907/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=1,134,144,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5908/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,134,336,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5909/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,134,528,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5910/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,134,720,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 + System/Peak GPU Memory (MB)=51,076 +[step=5911/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,134,912,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5912/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=1,135,104,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5913/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,135,296,000 + throughput/device/tokens_per_second=1,125 + throughput/device/batches_per_second=0.0469 +[step=5914/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=1,135,488,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5915/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,135,680,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5916/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,135,872,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5917/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,136,064,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0470 +[step=5918/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,136,256,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5919/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=1,136,448,000 + throughput/device/tokens_per_second=1,126 + throughput/device/batches_per_second=0.0469 +[step=5920/500000] + optim/total_grad_norm=1.479 + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=1,136,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5921/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,136,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5922/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,137,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5923/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,137,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5924/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,137,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5925/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,137,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5926/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=1,137,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5927/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,137,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5928/500000] + train/ActionNoiseL2Loss=0.0175 + throughput/total_tokens=1,138,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5929/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,138,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5930/500000] + train/ActionNoiseL2Loss=0.0997 + throughput/total_tokens=1,138,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5931/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,138,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5932/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,138,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5933/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,139,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5934/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=1,139,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5935/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,139,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5936/500000] + train/ActionNoiseL2Loss=0.1290 + throughput/total_tokens=1,139,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5937/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,139,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5938/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,140,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5939/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=1,140,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5940/500000] + optim/total_grad_norm=0.9446 + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=1,140,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5941/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,140,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5942/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,140,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5943/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,141,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5944/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,141,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5945/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,141,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5946/500000] + train/ActionNoiseL2Loss=0.1077 + throughput/total_tokens=1,141,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5947/500000] + train/ActionNoiseL2Loss=0.1443 + throughput/total_tokens=1,141,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5948/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,142,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5949/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,142,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5950/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,142,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=5951/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=1,142,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=5952/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,142,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5953/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,142,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5954/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=1,143,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5955/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,143,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5956/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,143,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5957/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,143,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5958/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,143,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5959/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,144,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5960/500000] + optim/total_grad_norm=0.7371 + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,144,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=5961/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,144,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5962/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,144,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5963/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,144,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5964/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,145,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=5965/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,145,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5966/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,145,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5967/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,145,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5968/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,145,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5969/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,146,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=5970/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,146,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5971/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,146,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5972/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=1,146,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5973/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,146,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5974/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,147,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5975/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,147,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5976/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,147,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5977/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,147,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5978/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,147,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=5979/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=1,147,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5980/500000] + optim/total_grad_norm=0.9146 + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=1,148,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5981/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=1,148,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5982/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,148,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5983/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,148,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5984/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,148,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5985/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,149,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5986/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,149,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5987/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,149,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5988/500000] + train/ActionNoiseL2Loss=0.1035 + throughput/total_tokens=1,149,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5989/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,149,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5990/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,150,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=5991/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=1,150,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5992/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,150,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5993/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,150,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5994/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,150,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5995/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,151,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5996/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=1,151,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5997/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,151,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=5998/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,151,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5999/500000] + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=1,151,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6000/500000] + optim/total_grad_norm=1.260 + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=1,152,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/13 [04:25:43] INFO | >> Saving config... checkpoint.py:608 +10/13 [04:26:26] INFO | >> Saving model state... checkpoint.py:796 +10/13 [04:27:39] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [04:29:12] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=6001/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,152,192,000 + throughput/device/tokens_per_second=1,128 + throughput/device/batches_per_second=0.0470 +[step=6002/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,152,384,000 + throughput/device/tokens_per_second=1,131 + throughput/device/batches_per_second=0.0471 +[step=6003/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,152,576,000 + throughput/device/tokens_per_second=1,111 + throughput/device/batches_per_second=0.0463 +[step=6004/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,152,768,000 + throughput/device/tokens_per_second=1,118 + throughput/device/batches_per_second=0.0466 +[step=6005/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,152,960,000 + throughput/device/tokens_per_second=1,124 + throughput/device/batches_per_second=0.0469 +[step=6006/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=1,153,152,000 + throughput/device/tokens_per_second=1,128 + throughput/device/batches_per_second=0.0470 +[step=6007/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,153,344,000 + throughput/device/tokens_per_second=1,131 + throughput/device/batches_per_second=0.0471 +[step=6008/500000] + train/ActionNoiseL2Loss=0.0975 + throughput/total_tokens=1,153,536,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=6009/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=1,153,728,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=6010/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=1,153,920,000 + throughput/device/tokens_per_second=1,136 + throughput/device/batches_per_second=0.0474 + System/Peak GPU Memory (MB)=51,076 +[step=6011/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,154,112,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=6012/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,154,304,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=6013/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=1,154,496,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=6014/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,154,688,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=6015/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,154,880,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=6016/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,155,072,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=6017/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,155,264,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=6018/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=1,155,456,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=6019/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=1,155,648,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=6020/500000] + optim/total_grad_norm=0.7203 + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,155,840,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,076 +[step=6021/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,156,032,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6022/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,156,224,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6023/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,156,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6024/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,156,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6025/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,156,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6026/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,156,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6027/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,157,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6028/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,157,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6029/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,157,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6030/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,157,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6031/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,157,952,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6032/500000] + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=1,158,144,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6033/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,158,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6034/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,158,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6035/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,158,720,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6036/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,158,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6037/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,159,104,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6038/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=1,159,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6039/500000] + train/ActionNoiseL2Loss=0.1478 + throughput/total_tokens=1,159,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6040/500000] + optim/total_grad_norm=0.8251 + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,159,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6041/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,159,872,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6042/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,160,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6043/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,160,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6044/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,160,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6045/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,160,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6046/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,160,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6047/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,161,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6048/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,161,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6049/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,161,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6050/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,161,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6051/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,161,792,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6052/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,161,984,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6053/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,162,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6054/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=1,162,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6055/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,162,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6056/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,162,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6057/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,162,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6058/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=1,163,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6059/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,163,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6060/500000] + optim/total_grad_norm=0.8532 + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,163,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6061/500000] + train/ActionNoiseL2Loss=0.1181 + throughput/total_tokens=1,163,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6062/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,163,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6063/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,164,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6064/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=1,164,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6065/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=1,164,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6066/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=1,164,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6067/500000] + train/ActionNoiseL2Loss=0.1099 + throughput/total_tokens=1,164,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6068/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,165,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6069/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,165,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6070/500000] + train/ActionNoiseL2Loss=0.1171 + throughput/total_tokens=1,165,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6071/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,165,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6072/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,165,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6073/500000] + train/ActionNoiseL2Loss=0.1284 + throughput/total_tokens=1,166,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6074/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,166,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6075/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,166,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6076/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=1,166,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6077/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,166,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6078/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,166,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6079/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,167,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6080/500000] + optim/total_grad_norm=1.227 + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=1,167,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6081/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,167,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6082/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=1,167,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6083/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,167,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6084/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,168,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6085/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,168,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6086/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=1,168,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6087/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,168,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6088/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,168,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6089/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=1,169,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6090/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,169,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6091/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=1,169,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6092/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,169,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6093/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,169,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6094/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,170,048,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6095/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,170,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6096/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,170,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6097/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,170,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6098/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,170,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6099/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,171,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6100/500000] + optim/total_grad_norm=1.258 + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,171,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6101/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,171,392,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6102/500000] + train/ActionNoiseL2Loss=0.0298 + throughput/total_tokens=1,171,584,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6103/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,171,776,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6104/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,171,968,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6105/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,172,160,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6106/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,172,352,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6107/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,172,544,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6108/500000] + train/ActionNoiseL2Loss=0.1127 + throughput/total_tokens=1,172,736,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6109/500000] + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=1,172,928,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6110/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,173,120,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=6111/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=1,173,312,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6112/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,173,504,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6113/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,173,696,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6114/500000] + train/ActionNoiseL2Loss=0.1253 + throughput/total_tokens=1,173,888,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6115/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,174,080,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6116/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,174,272,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6117/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,174,464,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6118/500000] + train/ActionNoiseL2Loss=0.1433 + throughput/total_tokens=1,174,656,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6119/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,174,848,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6120/500000] + optim/total_grad_norm=1.198 + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,175,040,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6121/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,175,232,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6122/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,175,424,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6123/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,175,616,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6124/500000] + train/ActionNoiseL2Loss=0.0295 + throughput/total_tokens=1,175,808,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6125/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,176,000,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6126/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,176,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6127/500000] + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=1,176,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6128/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,176,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6129/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,176,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6130/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,176,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6131/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,177,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6132/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,177,344,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6133/500000] + train/ActionNoiseL2Loss=0.1231 + throughput/total_tokens=1,177,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6134/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,177,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6135/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,177,920,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6136/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,178,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6137/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=1,178,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6138/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,178,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6139/500000] + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=1,178,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6140/500000] + optim/total_grad_norm=0.9519 + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,178,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6141/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=1,179,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6142/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,179,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6143/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=1,179,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6144/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,179,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6145/500000] + train/ActionNoiseL2Loss=0.1459 + throughput/total_tokens=1,179,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6146/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,180,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6147/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,180,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6148/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,180,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6149/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,180,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6150/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,180,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6151/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=1,180,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6152/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=1,181,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6153/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=1,181,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6154/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,181,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6155/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,181,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6156/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,181,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6157/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,182,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6158/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,182,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6159/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,182,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6160/500000] + optim/total_grad_norm=2.394 + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=1,182,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=6161/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,182,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6162/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,183,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6163/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,183,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6164/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=1,183,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6165/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,183,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6166/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,183,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6167/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,184,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6168/500000] + train/ActionNoiseL2Loss=0.1596 + throughput/total_tokens=1,184,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6169/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,184,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6170/500000] + train/ActionNoiseL2Loss=0.0252 + throughput/total_tokens=1,184,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6171/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=1,184,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6172/500000] + train/ActionNoiseL2Loss=0.0991 + throughput/total_tokens=1,185,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6173/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,185,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6174/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,185,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6175/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,185,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6176/500000] + train/ActionNoiseL2Loss=0.1138 + throughput/total_tokens=1,185,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6177/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,185,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6178/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=1,186,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6179/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,186,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6180/500000] + optim/total_grad_norm=1.213 + train/ActionNoiseL2Loss=0.1424 + throughput/total_tokens=1,186,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6181/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=1,186,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6182/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,186,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6183/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,187,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6184/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,187,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6185/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,187,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6186/500000] + train/ActionNoiseL2Loss=0.1005 + throughput/total_tokens=1,187,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6187/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,187,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6188/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,188,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6189/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,188,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6190/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,188,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6191/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,188,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6192/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,188,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6193/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,189,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6194/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=1,189,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6195/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,189,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6196/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,189,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6197/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=1,189,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6198/500000] + train/ActionNoiseL2Loss=0.1207 + throughput/total_tokens=1,190,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6199/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,190,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6200/500000] + optim/total_grad_norm=0.9534 + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,190,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6201/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,190,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6202/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,190,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6203/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,190,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6204/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,191,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6205/500000] + train/ActionNoiseL2Loss=0.1003 + throughput/total_tokens=1,191,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6206/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,191,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6207/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,191,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6208/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,191,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6209/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,192,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6210/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=1,192,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6211/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,192,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6212/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=1,192,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6213/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=1,192,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6214/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,193,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6215/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,193,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6216/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,193,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6217/500000] + train/ActionNoiseL2Loss=0.1326 + throughput/total_tokens=1,193,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6218/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=1,193,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6219/500000] + train/ActionNoiseL2Loss=0.1192 + throughput/total_tokens=1,194,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6220/500000] + optim/total_grad_norm=1.182 + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,194,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6221/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,194,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6222/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,194,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6223/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,194,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6224/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=1,195,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6225/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,195,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6226/500000] + train/ActionNoiseL2Loss=0.1296 + throughput/total_tokens=1,195,392,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6227/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,195,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6228/500000] + train/ActionNoiseL2Loss=0.1209 + throughput/total_tokens=1,195,776,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6229/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,195,968,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6230/500000] + train/ActionNoiseL2Loss=0.1115 + throughput/total_tokens=1,196,160,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6231/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,196,352,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6232/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,196,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6233/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=1,196,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6234/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,196,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6235/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,197,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6236/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,197,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6237/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,197,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6238/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,197,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6239/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,197,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6240/500000] + optim/total_grad_norm=0.8900 + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,198,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6241/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,198,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6242/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,198,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6243/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,198,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6244/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,198,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6245/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,199,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6246/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,199,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6247/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,199,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6248/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,199,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6249/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=1,199,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6250/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,200,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6251/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,200,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6252/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,200,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6253/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=1,200,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6254/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,200,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6255/500000] + train/ActionNoiseL2Loss=0.1037 + throughput/total_tokens=1,200,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6256/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,201,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6257/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,201,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6258/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,201,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6259/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,201,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6260/500000] + optim/total_grad_norm=1.104 + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,201,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6261/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=1,202,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6262/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=1,202,304,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6263/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,202,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6264/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,202,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6265/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,202,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6266/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,203,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6267/500000] + train/ActionNoiseL2Loss=0.1340 + throughput/total_tokens=1,203,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6268/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,203,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6269/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,203,648,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6270/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,203,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6271/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,204,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6272/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,204,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6273/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,204,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6274/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,204,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6275/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,204,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6276/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,204,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6277/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=1,205,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6278/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,205,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6279/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,205,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6280/500000] + optim/total_grad_norm=0.7072 + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,205,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6281/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=1,205,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6282/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,206,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6283/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=1,206,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6284/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,206,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6285/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,206,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6286/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,206,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6287/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,207,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6288/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=1,207,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6289/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=1,207,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6290/500000] + train/ActionNoiseL2Loss=0.0230 + throughput/total_tokens=1,207,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6291/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,207,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6292/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,208,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6293/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,208,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6294/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,208,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6295/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,208,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6296/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,208,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6297/500000] + train/ActionNoiseL2Loss=0.1211 + throughput/total_tokens=1,209,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6298/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,209,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6299/500000] + train/ActionNoiseL2Loss=0.1001 + throughput/total_tokens=1,209,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6300/500000] + optim/total_grad_norm=0.9944 + train/ActionNoiseL2Loss=0.1094 + throughput/total_tokens=1,209,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6301/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,209,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6302/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=1,209,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6303/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,210,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6304/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,210,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6305/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,210,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6306/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,210,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6307/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,210,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6308/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,211,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6309/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,211,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6310/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,211,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6311/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,211,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6312/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,211,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6313/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,212,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6314/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,212,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6315/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,212,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6316/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,212,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6317/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,212,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6318/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=1,213,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6319/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,213,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6320/500000] + optim/total_grad_norm=1.032 + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,213,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6321/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=1,213,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6322/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=1,213,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6323/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,214,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6324/500000] + train/ActionNoiseL2Loss=0.1013 + throughput/total_tokens=1,214,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6325/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,214,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6326/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,214,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6327/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,214,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6328/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,214,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6329/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,215,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6330/500000] + train/ActionNoiseL2Loss=0.1160 + throughput/total_tokens=1,215,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6331/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,215,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6332/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,215,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6333/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,215,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6334/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=1,216,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6335/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=1,216,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6336/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,216,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6337/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,216,704,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6338/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,216,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6339/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,217,088,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6340/500000] + optim/total_grad_norm=0.9988 + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,217,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6341/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,217,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6342/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,217,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6343/500000] + train/ActionNoiseL2Loss=0.0996 + throughput/total_tokens=1,217,856,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6344/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,218,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6345/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,218,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6346/500000] + train/ActionNoiseL2Loss=0.1178 + throughput/total_tokens=1,218,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6347/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,218,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6348/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=1,218,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6349/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,219,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6350/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=1,219,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6351/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,219,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6352/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=1,219,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6353/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,219,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6354/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,219,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6355/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,220,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6356/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,220,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6357/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,220,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6358/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,220,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6359/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=1,220,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6360/500000] + optim/total_grad_norm=1.465 + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=1,221,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6361/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,221,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6362/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,221,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6363/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=1,221,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6364/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,221,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6365/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,222,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6366/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,222,272,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6367/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,222,464,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6368/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,222,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6369/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=1,222,848,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6370/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,223,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6371/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=1,223,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6372/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,223,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6373/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=1,223,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6374/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,223,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6375/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,224,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6376/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,224,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6377/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,224,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6378/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,224,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6379/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,224,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6380/500000] + optim/total_grad_norm=1.058 + train/ActionNoiseL2Loss=0.1099 + throughput/total_tokens=1,224,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6381/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,225,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6382/500000] + train/ActionNoiseL2Loss=0.0236 + throughput/total_tokens=1,225,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6383/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,225,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6384/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,225,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6385/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,225,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6386/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,226,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6387/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,226,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6388/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,226,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6389/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,226,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6390/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,226,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6391/500000] + train/ActionNoiseL2Loss=0.1195 + throughput/total_tokens=1,227,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6392/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,227,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6393/500000] + train/ActionNoiseL2Loss=0.1394 + throughput/total_tokens=1,227,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6394/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,227,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6395/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,227,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6396/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,228,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6397/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,228,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6398/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,228,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6399/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,228,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6400/500000] + optim/total_grad_norm=0.7986 + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,228,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6401/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,228,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6402/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,229,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6403/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,229,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6404/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,229,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6405/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,229,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6406/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,229,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6407/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,230,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6408/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,230,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6409/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,230,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6410/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,230,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6411/500000] + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=1,230,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6412/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,231,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6413/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,231,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6414/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,231,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6415/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,231,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6416/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=1,231,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6417/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=1,232,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6418/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,232,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6419/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,232,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6420/500000] + optim/total_grad_norm=1.064 + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,232,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6421/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,232,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6422/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,233,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6423/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,233,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6424/500000] + train/ActionNoiseL2Loss=0.0271 + throughput/total_tokens=1,233,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6425/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,233,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6426/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,233,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6427/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,233,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6428/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,234,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6429/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=1,234,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6430/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,234,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6431/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,234,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6432/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,234,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6433/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,235,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6434/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,235,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6435/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,235,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6436/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,235,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6437/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,235,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6438/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,236,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6439/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,236,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6440/500000] + optim/total_grad_norm=0.8735 + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,236,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6441/500000] + train/ActionNoiseL2Loss=0.0237 + throughput/total_tokens=1,236,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6442/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,236,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6443/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,237,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6444/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,237,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6445/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,237,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6446/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,237,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6447/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,237,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6448/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,238,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6449/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,238,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6450/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=1,238,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6451/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,238,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6452/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=1,238,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6453/500000] + train/ActionNoiseL2Loss=0.1114 + throughput/total_tokens=1,238,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6454/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,239,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6455/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,239,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6456/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,239,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6457/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,239,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6458/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,239,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6459/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,240,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6460/500000] + optim/total_grad_norm=1.486 + train/ActionNoiseL2Loss=0.1258 + throughput/total_tokens=1,240,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6461/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,240,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6462/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,240,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6463/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,240,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6464/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,241,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6465/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,241,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6466/500000] + train/ActionNoiseL2Loss=0.0948 + throughput/total_tokens=1,241,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6467/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=1,241,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6468/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,241,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6469/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,242,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6470/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=1,242,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6471/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,242,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6472/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,242,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6473/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,242,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6474/500000] + train/ActionNoiseL2Loss=0.0948 + throughput/total_tokens=1,243,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6475/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,243,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6476/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,243,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6477/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,243,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6478/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,243,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6479/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,243,968,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6480/500000] + optim/total_grad_norm=0.9250 + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,244,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6481/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,244,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6482/500000] + train/ActionNoiseL2Loss=0.0266 + throughput/total_tokens=1,244,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6483/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,244,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6484/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=1,244,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6485/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,245,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6486/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=1,245,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6487/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,245,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6488/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,245,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6489/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,245,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6490/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,246,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6491/500000] + train/ActionNoiseL2Loss=0.1199 + throughput/total_tokens=1,246,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6492/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,246,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6493/500000] + train/ActionNoiseL2Loss=0.0185 + throughput/total_tokens=1,246,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6494/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=1,246,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6495/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,247,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6496/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,247,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6497/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=1,247,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6498/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,247,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6499/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,247,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6500/500000] + optim/total_grad_norm=0.9355 + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,248,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/13 [07:24:56] INFO | >> Saving config... checkpoint.py:608 +10/13 [07:25:40] INFO | >> Saving model state... checkpoint.py:796 +10/13 [07:26:51] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [07:28:22] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=6501/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,248,192,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6502/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,248,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6503/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,248,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6504/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,248,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6505/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=1,248,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6506/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,249,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6507/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,249,344,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6508/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,249,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6509/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,249,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6510/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,249,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6511/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=1,250,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6512/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,250,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6513/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,250,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6514/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,250,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6515/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,250,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6516/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,251,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6517/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,251,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6518/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,251,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6519/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,251,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6520/500000] + optim/total_grad_norm=1.717 + train/ActionNoiseL2Loss=0.1253 + throughput/total_tokens=1,251,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6521/500000] + train/ActionNoiseL2Loss=0.0906 + throughput/total_tokens=1,252,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6522/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,252,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6523/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,252,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6524/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,252,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6525/500000] + train/ActionNoiseL2Loss=0.0168 + throughput/total_tokens=1,252,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6526/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,252,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6527/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,253,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6528/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,253,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6529/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,253,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6530/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=1,253,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6531/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=1,253,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6532/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,254,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6533/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,254,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6534/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,254,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6535/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,254,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6536/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=1,254,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6537/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,255,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6538/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=1,255,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6539/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,255,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6540/500000] + optim/total_grad_norm=1.077 + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,255,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6541/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,255,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6542/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,256,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6543/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,256,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6544/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,256,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6545/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,256,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6546/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=1,256,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6547/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,257,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6548/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,257,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6549/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,257,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6550/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,257,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6551/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,257,792,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6552/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,257,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6553/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,258,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6554/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,258,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6555/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=1,258,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6556/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,258,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6557/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,258,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6558/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,259,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6559/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,259,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6560/500000] + optim/total_grad_norm=1.250 + train/ActionNoiseL2Loss=0.0911 + throughput/total_tokens=1,259,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6561/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=1,259,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6562/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=1,259,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6563/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,260,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6564/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,260,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6565/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,260,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6566/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,260,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6567/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,260,864,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6568/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,261,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6569/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,261,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6570/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,261,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6571/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,261,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6572/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,261,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6573/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,262,016,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6574/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,262,208,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6575/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=1,262,400,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6576/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,262,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6577/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,262,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6578/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,262,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6579/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=1,263,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6580/500000] + optim/total_grad_norm=0.9071 + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=1,263,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6581/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,263,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6582/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,263,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6583/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,263,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6584/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,264,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6585/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,264,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6586/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=1,264,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6587/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,264,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6588/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,264,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6589/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,265,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6590/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,265,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6591/500000] + train/ActionNoiseL2Loss=0.1100 + throughput/total_tokens=1,265,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6592/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=1,265,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6593/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,265,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6594/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,266,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6595/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=1,266,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6596/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,266,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6597/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,266,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6598/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,266,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6599/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=1,267,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6600/500000] + optim/total_grad_norm=1.723 + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,267,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6601/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,267,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6602/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=1,267,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6603/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,267,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6604/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,267,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6605/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,268,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6606/500000] + train/ActionNoiseL2Loss=0.0986 + throughput/total_tokens=1,268,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6607/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,268,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6608/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,268,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6609/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=1,268,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6610/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,269,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6611/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,269,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6612/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,269,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6613/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,269,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6614/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,269,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6615/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,270,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6616/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,270,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6617/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,270,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6618/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,270,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6619/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=1,270,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6620/500000] + optim/total_grad_norm=1.034 + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,271,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6621/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,271,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6622/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=1,271,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6623/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,271,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6624/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,271,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6625/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,272,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6626/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=1,272,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6627/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,272,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6628/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,272,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6629/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,272,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6630/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,272,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6631/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,273,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6632/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,273,344,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6633/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,273,536,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6634/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,273,728,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6635/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,273,920,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6636/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,274,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6637/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,274,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6638/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,274,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6639/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,274,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6640/500000] + optim/total_grad_norm=0.6913 + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,274,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6641/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,275,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6642/500000] + train/ActionNoiseL2Loss=0.0293 + throughput/total_tokens=1,275,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6643/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,275,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6644/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,275,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6645/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,275,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6646/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,276,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6647/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=1,276,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6648/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,276,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6649/500000] + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=1,276,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6650/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,276,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6651/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=1,276,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6652/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,277,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6653/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,277,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6654/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=1,277,568,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6655/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,277,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6656/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,277,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6657/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,278,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6658/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,278,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6659/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,278,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6660/500000] + optim/total_grad_norm=0.5230 + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,278,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6661/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,278,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6662/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,279,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6663/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,279,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6664/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,279,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6665/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=1,279,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6666/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,279,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6667/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,280,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6668/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=1,280,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6669/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,280,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6670/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,280,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6671/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,280,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6672/500000] + train/ActionNoiseL2Loss=0.1238 + throughput/total_tokens=1,281,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6673/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,281,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6674/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,281,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6675/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=1,281,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6676/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,281,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6677/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,281,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6678/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=1,282,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6679/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,282,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6680/500000] + optim/total_grad_norm=0.7677 + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,282,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6681/500000] + train/ActionNoiseL2Loss=0.1120 + throughput/total_tokens=1,282,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6682/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=1,282,944,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6683/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,283,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6684/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,283,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6685/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,283,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6686/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,283,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6687/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=1,283,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6688/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,284,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6689/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,284,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6690/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,284,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6691/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,284,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6692/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,284,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6693/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,285,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6694/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,285,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6695/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,285,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6696/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,285,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6697/500000] + train/ActionNoiseL2Loss=0.1427 + throughput/total_tokens=1,285,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6698/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,286,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6699/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,286,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6700/500000] + optim/total_grad_norm=0.9746 + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,286,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6701/500000] + train/ActionNoiseL2Loss=0.0959 + throughput/total_tokens=1,286,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6702/500000] + train/ActionNoiseL2Loss=0.1355 + throughput/total_tokens=1,286,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6703/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,286,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6704/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,287,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6705/500000] + train/ActionNoiseL2Loss=0.1437 + throughput/total_tokens=1,287,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6706/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=1,287,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6707/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=1,287,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6708/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,287,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6709/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,288,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6710/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,288,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6711/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,288,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6712/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,288,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6713/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,288,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6714/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,289,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6715/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,289,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6716/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,289,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6717/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,289,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6718/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,289,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6719/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,290,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6720/500000] + optim/total_grad_norm=0.9082 + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,290,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6721/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,290,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6722/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,290,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6723/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,290,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6724/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=1,291,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6725/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=1,291,200,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6726/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,291,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6727/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,291,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6728/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,291,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6729/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,291,968,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6730/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,292,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6731/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=1,292,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6732/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,292,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6733/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=1,292,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6734/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,292,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6735/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,293,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6736/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,293,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6737/500000] + train/ActionNoiseL2Loss=0.1092 + throughput/total_tokens=1,293,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6738/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,293,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6739/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,293,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6740/500000] + optim/total_grad_norm=0.6800 + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,294,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6741/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,294,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6742/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,294,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6743/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=1,294,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6744/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,294,848,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6745/500000] + train/ActionNoiseL2Loss=0.1425 + throughput/total_tokens=1,295,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6746/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,295,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6747/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,295,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6748/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,295,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6749/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=1,295,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6750/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,296,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6751/500000] + train/ActionNoiseL2Loss=0.1066 + throughput/total_tokens=1,296,192,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6752/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,296,384,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6753/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,296,576,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6754/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,296,768,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6755/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,296,960,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6756/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,297,152,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6757/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=1,297,344,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6758/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,297,536,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6759/500000] + train/ActionNoiseL2Loss=0.1251 + throughput/total_tokens=1,297,728,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6760/500000] + optim/total_grad_norm=0.8191 + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,297,920,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=6761/500000] + train/ActionNoiseL2Loss=0.1738 + throughput/total_tokens=1,298,112,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6762/500000] + train/ActionNoiseL2Loss=0.1097 + throughput/total_tokens=1,298,304,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6763/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,298,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6764/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,298,688,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6765/500000] + train/ActionNoiseL2Loss=0.1143 + throughput/total_tokens=1,298,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6766/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,299,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6767/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,299,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6768/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,299,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6769/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,299,648,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6770/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,299,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6771/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,300,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6772/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,300,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6773/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,300,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6774/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,300,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6775/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,300,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6776/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,300,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6777/500000] + train/ActionNoiseL2Loss=0.1108 + throughput/total_tokens=1,301,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6778/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=1,301,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6779/500000] + train/ActionNoiseL2Loss=0.1104 + throughput/total_tokens=1,301,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6780/500000] + optim/total_grad_norm=0.9782 + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=1,301,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6781/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,301,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6782/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=1,302,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6783/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,302,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6784/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,302,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6785/500000] + train/ActionNoiseL2Loss=0.1454 + throughput/total_tokens=1,302,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6786/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,302,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6787/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,303,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6788/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,303,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6789/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,303,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6790/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,303,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6791/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=1,303,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6792/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,304,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6793/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,304,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6794/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,304,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6795/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,304,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6796/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,304,832,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6797/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=1,305,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6798/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,305,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6799/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,305,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6800/500000] + optim/total_grad_norm=1.267 + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=1,305,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6801/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,305,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6802/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,305,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6803/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,306,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6804/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=1,306,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6805/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,306,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6806/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,306,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6807/500000] + train/ActionNoiseL2Loss=0.1197 + throughput/total_tokens=1,306,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6808/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=1,307,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6809/500000] + train/ActionNoiseL2Loss=0.1173 + throughput/total_tokens=1,307,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6810/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=1,307,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6811/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,307,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6812/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,307,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6813/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,308,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6814/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,308,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6815/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,308,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6816/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,308,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6817/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=1,308,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6818/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,309,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6819/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=1,309,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6820/500000] + optim/total_grad_norm=0.5340 + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,309,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6821/500000] + train/ActionNoiseL2Loss=0.1159 + throughput/total_tokens=1,309,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6822/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,309,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6823/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,310,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6824/500000] + train/ActionNoiseL2Loss=0.1100 + throughput/total_tokens=1,310,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6825/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,310,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6826/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,310,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6827/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,310,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6828/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,310,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6829/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,311,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6830/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,311,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6831/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,311,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6832/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=1,311,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6833/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,311,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6834/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,312,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6835/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,312,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6836/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,312,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6837/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,312,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6838/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,312,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6839/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,313,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6840/500000] + optim/total_grad_norm=0.7608 + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=1,313,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6841/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,313,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6842/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,313,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6843/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,313,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6844/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,314,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6845/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=1,314,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6846/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,314,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6847/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,314,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6848/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,314,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6849/500000] + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=1,315,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6850/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,315,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6851/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,315,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6852/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,315,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6853/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,315,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6854/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,315,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6855/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=1,316,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6856/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,316,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6857/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,316,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6858/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,316,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6859/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=1,316,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6860/500000] + optim/total_grad_norm=0.5269 + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,317,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6861/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,317,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6862/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,317,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6863/500000] + train/ActionNoiseL2Loss=0.1134 + throughput/total_tokens=1,317,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6864/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,317,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6865/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,318,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6866/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=1,318,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6867/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,318,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6868/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,318,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6869/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,318,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6870/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,319,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6871/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=1,319,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6872/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,319,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6873/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,319,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6874/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,319,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6875/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,320,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6876/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,320,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6877/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,320,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6878/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,320,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6879/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,320,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6880/500000] + optim/total_grad_norm=0.6034 + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,320,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6881/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=1,321,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6882/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,321,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6883/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,321,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6884/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,321,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6885/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,321,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6886/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=1,322,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6887/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,322,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6888/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,322,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6889/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,322,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6890/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,322,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6891/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,323,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6892/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,323,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6893/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,323,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6894/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,323,648,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6895/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,323,840,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6896/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,324,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6897/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,324,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6898/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,324,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6899/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,324,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6900/500000] + optim/total_grad_norm=0.8074 + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,324,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6901/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,324,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6902/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=1,325,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6903/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,325,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6904/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,325,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6905/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,325,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6906/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,325,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6907/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,326,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6908/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,326,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6909/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,326,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6910/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,326,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=6911/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,326,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6912/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,327,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6913/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,327,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6914/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=1,327,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6915/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,327,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6916/500000] + train/ActionNoiseL2Loss=0.1022 + throughput/total_tokens=1,327,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6917/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,328,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6918/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,328,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6919/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,328,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6920/500000] + optim/total_grad_norm=1.749 + train/ActionNoiseL2Loss=0.1102 + throughput/total_tokens=1,328,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6921/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,328,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6922/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,329,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6923/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,329,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6924/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,329,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6925/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,329,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6926/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,329,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6927/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,329,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6928/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,330,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6929/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,330,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6930/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,330,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6931/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,330,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6932/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,330,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6933/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,331,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6934/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=1,331,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6935/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,331,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6936/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,331,712,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6937/500000] + train/ActionNoiseL2Loss=0.0245 + throughput/total_tokens=1,331,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6938/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,332,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6939/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,332,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6940/500000] + optim/total_grad_norm=0.6471 + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,332,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=6941/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=1,332,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6942/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,332,864,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6943/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,333,056,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6944/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=1,333,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6945/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,333,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6946/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,333,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6947/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,333,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6948/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=1,334,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6949/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=1,334,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=6950/500000] + train/ActionNoiseL2Loss=0.0219 + throughput/total_tokens=1,334,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6951/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,334,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6952/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,334,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=6953/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,334,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6954/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,335,168,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6955/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=1,335,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6956/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=1,335,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6957/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,335,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6958/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,335,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6959/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,336,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6960/500000] + optim/total_grad_norm=0.5157 + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,336,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=6961/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,336,512,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6962/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,336,704,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6963/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,336,896,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6964/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=1,337,088,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6965/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,337,280,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6966/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,337,472,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6967/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,337,664,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=6968/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=1,337,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6969/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=1,338,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=6970/500000] + train/ActionNoiseL2Loss=0.1193 + throughput/total_tokens=1,338,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6971/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,338,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6972/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,338,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6973/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,338,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6974/500000] + train/ActionNoiseL2Loss=0.1295 + throughput/total_tokens=1,339,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6975/500000] + train/ActionNoiseL2Loss=0.0249 + throughput/total_tokens=1,339,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6976/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=1,339,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6977/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,339,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6978/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,339,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6979/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=1,339,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6980/500000] + optim/total_grad_norm=1.322 + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,340,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6981/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,340,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6982/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,340,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=6983/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,340,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6984/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=1,340,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6985/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,341,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=6986/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,341,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6987/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=1,341,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6988/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,341,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=6989/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,341,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6990/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,342,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=6991/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=1,342,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6992/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,342,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6993/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,342,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6994/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,342,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6995/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,343,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=6996/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,343,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=6997/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,343,424,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6998/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,343,616,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=6999/500000] + train/ActionNoiseL2Loss=0.1059 + throughput/total_tokens=1,343,808,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7000/500000] + optim/total_grad_norm=1.014 + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,344,000,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +10/13 [10:23:55] INFO | >> Saving config... checkpoint.py:608 +10/13 [10:24:40] INFO | >> Saving model state... checkpoint.py:796 +10/13 [10:25:51] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [10:27:22] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=7001/500000] + train/ActionNoiseL2Loss=0.1142 + throughput/total_tokens=1,344,192,000 + throughput/device/tokens_per_second=1,130 + throughput/device/batches_per_second=0.0471 +[step=7002/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,344,384,000 + throughput/device/tokens_per_second=1,127 + throughput/device/batches_per_second=0.0470 +[step=7003/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,344,576,000 + throughput/device/tokens_per_second=1,115 + throughput/device/batches_per_second=0.0465 +[step=7004/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=1,344,768,000 + throughput/device/tokens_per_second=1,123 + throughput/device/batches_per_second=0.0468 +[step=7005/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=1,344,960,000 + throughput/device/tokens_per_second=1,127 + throughput/device/batches_per_second=0.0470 +[step=7006/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=1,345,152,000 + throughput/device/tokens_per_second=1,132 + throughput/device/batches_per_second=0.0472 +[step=7007/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,345,344,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=7008/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,345,536,000 + throughput/device/tokens_per_second=1,136 + throughput/device/batches_per_second=0.0473 +[step=7009/500000] + train/ActionNoiseL2Loss=0.0286 + throughput/total_tokens=1,345,728,000 + throughput/device/tokens_per_second=1,136 + throughput/device/batches_per_second=0.0474 +[step=7010/500000] + train/ActionNoiseL2Loss=0.1182 + throughput/total_tokens=1,345,920,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 + System/Peak GPU Memory (MB)=51,076 +[step=7011/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=1,346,112,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=7012/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,346,304,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=7013/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,346,496,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=7014/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,346,688,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=7015/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,346,880,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=7016/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,347,072,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=7017/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,347,264,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=7018/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,347,456,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=7019/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=1,347,648,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=7020/500000] + optim/total_grad_norm=0.5421 + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,347,840,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,076 +[step=7021/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,348,032,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7022/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=1,348,224,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7023/500000] + train/ActionNoiseL2Loss=0.1262 + throughput/total_tokens=1,348,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7024/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,348,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7025/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=1,348,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7026/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=1,348,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7027/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,349,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7028/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,349,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7029/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,349,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7030/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,349,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7031/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,349,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7032/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,350,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7033/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,350,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7034/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,350,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7035/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=1,350,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7036/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,350,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7037/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,351,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7038/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,351,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7039/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,351,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7040/500000] + optim/total_grad_norm=1.072 + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,351,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7041/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=1,351,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7042/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=1,352,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7043/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,352,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7044/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,352,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7045/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,352,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7046/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,352,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7047/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,353,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7048/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,353,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7049/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=1,353,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7050/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=1,353,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7051/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,353,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7052/500000] + train/ActionNoiseL2Loss=0.1055 + throughput/total_tokens=1,353,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7053/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,354,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7054/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,354,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7055/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,354,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7056/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=1,354,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7057/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,354,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7058/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,355,136,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7059/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,355,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7060/500000] + optim/total_grad_norm=0.5448 + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,355,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=7061/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,355,712,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7062/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=1,355,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7063/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,356,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7064/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,356,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7065/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,356,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7066/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,356,672,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7067/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,356,864,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7068/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,357,056,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7069/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=1,357,248,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7070/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,357,440,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7071/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,357,632,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7072/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,357,824,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7073/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=1,358,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7074/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,358,208,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7075/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,358,400,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7076/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,358,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7077/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,358,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7078/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,358,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7079/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,359,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7080/500000] + optim/total_grad_norm=0.5597 + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,359,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7081/500000] + train/ActionNoiseL2Loss=0.1172 + throughput/total_tokens=1,359,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7082/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,359,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7083/500000] + train/ActionNoiseL2Loss=0.1333 + throughput/total_tokens=1,359,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7084/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=1,360,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7085/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,360,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7086/500000] + train/ActionNoiseL2Loss=0.0971 + throughput/total_tokens=1,360,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7087/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,360,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7088/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,360,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7089/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,361,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7090/500000] + train/ActionNoiseL2Loss=0.1045 + throughput/total_tokens=1,361,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7091/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=1,361,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7092/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,361,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7093/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,361,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7094/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,362,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7095/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,362,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7096/500000] + train/ActionNoiseL2Loss=0.0237 + throughput/total_tokens=1,362,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7097/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,362,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7098/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,362,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7099/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,363,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7100/500000] + optim/total_grad_norm=0.9139 + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,363,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7101/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,363,392,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7102/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,363,584,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7103/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,363,776,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7104/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,363,968,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7105/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,364,160,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=7106/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,364,352,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7107/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,364,544,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7108/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,364,736,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=7109/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,364,928,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=7110/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,365,120,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 + System/Peak GPU Memory (MB)=51,076 +[step=7111/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,365,312,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=7112/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,365,504,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=7113/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=1,365,696,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7114/500000] + train/ActionNoiseL2Loss=0.0935 + throughput/total_tokens=1,365,888,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7115/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=1,366,080,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7116/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,366,272,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7117/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,366,464,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7118/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,366,656,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7119/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,366,848,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7120/500000] + optim/total_grad_norm=1.166 + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=1,367,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7121/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,367,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7122/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,367,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7123/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=1,367,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7124/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=1,367,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7125/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,368,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7126/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,368,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7127/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,368,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7128/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,368,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7129/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,368,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7130/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=1,368,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7131/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,369,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7132/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,369,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7133/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,369,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7134/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,369,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7135/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,369,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7136/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,370,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7137/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,370,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7138/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=1,370,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7139/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,370,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7140/500000] + optim/total_grad_norm=0.8662 + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,370,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7141/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,371,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7142/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,371,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7143/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=1,371,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7144/500000] + train/ActionNoiseL2Loss=0.0877 + throughput/total_tokens=1,371,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7145/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=1,371,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7146/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,372,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7147/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,372,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7148/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,372,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7149/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,372,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7150/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=1,372,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7151/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,372,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7152/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,373,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7153/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,373,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7154/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,373,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7155/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,373,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7156/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=1,373,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7157/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,374,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7158/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,374,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7159/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,374,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7160/500000] + optim/total_grad_norm=0.7149 + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,374,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7161/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=1,374,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7162/500000] + train/ActionNoiseL2Loss=0.0950 + throughput/total_tokens=1,375,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7163/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,375,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7164/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,375,488,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7165/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,375,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7166/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,375,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7167/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,376,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7168/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,376,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7169/500000] + train/ActionNoiseL2Loss=0.0961 + throughput/total_tokens=1,376,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7170/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=1,376,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7171/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,376,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7172/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=1,377,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7173/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,377,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7174/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,377,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7175/500000] + train/ActionNoiseL2Loss=0.1426 + throughput/total_tokens=1,377,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7176/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,377,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7177/500000] + train/ActionNoiseL2Loss=0.0234 + throughput/total_tokens=1,377,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7178/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=1,378,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7179/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=1,378,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7180/500000] + optim/total_grad_norm=0.8852 + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,378,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7181/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=1,378,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7182/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,378,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7183/500000] + train/ActionNoiseL2Loss=0.0260 + throughput/total_tokens=1,379,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7184/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,379,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7185/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,379,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7186/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=1,379,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7187/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,379,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7188/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,380,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7189/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,380,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7190/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,380,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7191/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=1,380,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7192/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,380,864,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7193/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=1,381,056,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7194/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,381,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7195/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,381,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7196/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,381,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7197/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,381,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7198/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,382,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7199/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,382,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7200/500000] + optim/total_grad_norm=1.688 + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=1,382,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7201/500000] + train/ActionNoiseL2Loss=0.1327 + throughput/total_tokens=1,382,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7202/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=1,382,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7203/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,382,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7204/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=1,383,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7205/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,383,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7206/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,383,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7207/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,383,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7208/500000] + train/ActionNoiseL2Loss=0.0972 + throughput/total_tokens=1,383,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7209/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,384,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7210/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,384,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7211/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,384,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7212/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=1,384,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7213/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,384,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7214/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,385,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7215/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,385,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7216/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,385,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7217/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,385,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7218/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,385,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7219/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,386,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7220/500000] + optim/total_grad_norm=1.340 + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,386,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7221/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=1,386,432,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7222/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,386,624,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7223/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,386,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7224/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,387,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7225/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=1,387,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7226/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,387,392,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7227/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=1,387,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7228/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,387,776,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7229/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,387,968,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7230/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,388,160,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7231/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,388,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7232/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=1,388,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7233/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,388,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7234/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,388,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7235/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,389,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7236/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=1,389,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7237/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,389,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7238/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,389,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7239/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,389,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7240/500000] + optim/total_grad_norm=0.7998 + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,390,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7241/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,390,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7242/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,390,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7243/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,390,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7244/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,390,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7245/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,391,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7246/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,391,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7247/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,391,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7248/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,391,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7249/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,391,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7250/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,392,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7251/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,392,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7252/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,392,384,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7253/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,392,576,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7254/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,392,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7255/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,392,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7256/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,393,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7257/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,393,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7258/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=1,393,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7259/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,393,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7260/500000] + optim/total_grad_norm=1.569 + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=1,393,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7261/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,394,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7262/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,394,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7263/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=1,394,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7264/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,394,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7265/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,394,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7266/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,395,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7267/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,395,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7268/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,395,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7269/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,395,648,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7270/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,395,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7271/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,396,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7272/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,396,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7273/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,396,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7274/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=1,396,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7275/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,396,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7276/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=1,396,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7277/500000] + train/ActionNoiseL2Loss=0.1059 + throughput/total_tokens=1,397,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7278/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,397,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7279/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,397,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7280/500000] + optim/total_grad_norm=0.9151 + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=1,397,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7281/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,397,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7282/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,398,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7283/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=1,398,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7284/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,398,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7285/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,398,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7286/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,398,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7287/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=1,399,104,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7288/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,399,296,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7289/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,399,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7290/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,399,680,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7291/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,399,872,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7292/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=1,400,064,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7293/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,400,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7294/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,400,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7295/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,400,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7296/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=1,400,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7297/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,401,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7298/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,401,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7299/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,401,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7300/500000] + optim/total_grad_norm=0.8824 + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,401,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7301/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,401,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7302/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,401,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7303/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,402,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7304/500000] + train/ActionNoiseL2Loss=0.0982 + throughput/total_tokens=1,402,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7305/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,402,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7306/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,402,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7307/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,402,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7308/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,403,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7309/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,403,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7310/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,403,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7311/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,403,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7312/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,403,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7313/500000] + train/ActionNoiseL2Loss=0.1052 + throughput/total_tokens=1,404,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7314/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,404,288,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7315/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,404,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7316/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,404,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7317/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=1,404,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7318/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,405,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7319/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,405,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7320/500000] + optim/total_grad_norm=1.208 + train/ActionNoiseL2Loss=0.1047 + throughput/total_tokens=1,405,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7321/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=1,405,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7322/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=1,405,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7323/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,406,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7324/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,406,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7325/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,406,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7326/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,406,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7327/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,406,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7328/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,406,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7329/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,407,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7330/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,407,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7331/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,407,552,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7332/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,407,744,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7333/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,407,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7334/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,408,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7335/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=1,408,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7336/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,408,512,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7337/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,408,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7338/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,408,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7339/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,409,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7340/500000] + optim/total_grad_norm=0.7042 + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,409,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7341/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,409,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7342/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,409,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7343/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,409,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7344/500000] + train/ActionNoiseL2Loss=0.0275 + throughput/total_tokens=1,410,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7345/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,410,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7346/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,410,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7347/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,410,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7348/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=1,410,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7349/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,411,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7350/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,411,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7351/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,411,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7352/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,411,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7353/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,411,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7354/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,411,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7355/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,412,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7356/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,412,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7357/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,412,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7358/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=1,412,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7359/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,412,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7360/500000] + optim/total_grad_norm=0.5773 + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,413,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7361/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,413,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7362/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,413,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7363/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,413,696,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7364/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,413,888,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7365/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,414,080,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7366/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,414,272,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7367/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,414,464,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7368/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,414,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7369/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,414,848,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7370/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=1,415,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7371/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,415,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7372/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,415,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7373/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=1,415,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7374/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=1,415,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7375/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,416,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7376/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=1,416,192,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7377/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=1,416,384,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7378/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,416,576,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7379/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,416,768,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7380/500000] + optim/total_grad_norm=0.7162 + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,416,960,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7381/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=1,417,152,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7382/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,417,344,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7383/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,417,536,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7384/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,417,728,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7385/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,417,920,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7386/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,418,112,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7387/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,418,304,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7388/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=1,418,496,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7389/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,418,688,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7390/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,418,880,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7391/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,419,072,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7392/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,419,264,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7393/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,419,456,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7394/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,419,648,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7395/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,419,840,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7396/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,420,032,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7397/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=1,420,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7398/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,420,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7399/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,420,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7400/500000] + optim/total_grad_norm=0.5995 + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,420,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7401/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,420,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7402/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,421,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7403/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,421,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7404/500000] + train/ActionNoiseL2Loss=0.1336 + throughput/total_tokens=1,421,568,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7405/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=1,421,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7406/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=1,421,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7407/500000] + train/ActionNoiseL2Loss=0.0235 + throughput/total_tokens=1,422,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7408/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,422,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7409/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,422,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7410/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,422,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7411/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,422,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7412/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,423,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7413/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,423,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7414/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,423,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7415/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,423,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7416/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,423,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7417/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=1,424,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7418/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=1,424,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7419/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,424,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7420/500000] + optim/total_grad_norm=1.165 + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,424,640,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7421/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,424,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7422/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,425,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7423/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,425,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7424/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,425,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7425/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,425,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7426/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,425,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7427/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,425,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7428/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,426,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7429/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,426,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7430/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,426,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7431/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,426,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7432/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=1,426,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7433/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,427,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7434/500000] + train/ActionNoiseL2Loss=0.1293 + throughput/total_tokens=1,427,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7435/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,427,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7436/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=1,427,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7437/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,427,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7438/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,428,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7439/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,428,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7440/500000] + optim/total_grad_norm=0.4740 + train/ActionNoiseL2Loss=0.0213 + throughput/total_tokens=1,428,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7441/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,428,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7442/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=1,428,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7443/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,429,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7444/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=1,429,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7445/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,429,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7446/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,429,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7447/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,429,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7448/500000] + train/ActionNoiseL2Loss=0.1131 + throughput/total_tokens=1,430,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7449/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,430,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7450/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,430,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7451/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,430,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7452/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,430,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7453/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,430,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7454/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,431,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7455/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,431,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7456/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,431,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7457/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,431,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7458/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,431,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7459/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,432,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7460/500000] + optim/total_grad_norm=1.085 + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,432,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7461/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=1,432,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7462/500000] + train/ActionNoiseL2Loss=0.0982 + throughput/total_tokens=1,432,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7463/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=1,432,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7464/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,433,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7465/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=1,433,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7466/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,433,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7467/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,433,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7468/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,433,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7469/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,434,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7470/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,434,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7471/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,434,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7472/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,434,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7473/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,434,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7474/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,435,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7475/500000] + train/ActionNoiseL2Loss=0.1222 + throughput/total_tokens=1,435,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7476/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,435,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7477/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,435,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7478/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,435,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7479/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=1,435,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7480/500000] + optim/total_grad_norm=1.120 + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,436,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7481/500000] + train/ActionNoiseL2Loss=0.0278 + throughput/total_tokens=1,436,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7482/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,436,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7483/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,436,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7484/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,436,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7485/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,437,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7486/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,437,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7487/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,437,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7488/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,437,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7489/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,437,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7490/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,438,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7491/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,438,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7492/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,438,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7493/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,438,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7494/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,438,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7495/500000] + train/ActionNoiseL2Loss=0.1053 + throughput/total_tokens=1,439,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7496/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,439,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7497/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,439,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7498/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,439,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7499/500000] + train/ActionNoiseL2Loss=0.0202 + throughput/total_tokens=1,439,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7500/500000] + optim/total_grad_norm=0.7244 + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=1,440,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/13 [13:22:50] INFO | >> Saving config... checkpoint.py:608 +10/13 [13:23:34] INFO | >> Saving model state... checkpoint.py:796 +10/13 [13:24:46] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [13:26:14] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=7501/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,440,192,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7502/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,440,384,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=7503/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,440,576,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7504/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,440,768,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7505/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,440,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7506/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,441,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7507/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=1,441,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7508/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,441,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7509/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=1,441,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7510/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=1,441,920,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7511/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,442,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7512/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,442,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7513/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,442,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7514/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=1,442,688,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7515/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,442,880,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7516/500000] + train/ActionNoiseL2Loss=0.1366 + throughput/total_tokens=1,443,072,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7517/500000] + train/ActionNoiseL2Loss=0.1032 + throughput/total_tokens=1,443,264,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7518/500000] + train/ActionNoiseL2Loss=0.1023 + throughput/total_tokens=1,443,456,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7519/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,443,648,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7520/500000] + optim/total_grad_norm=1.595 + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,443,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7521/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,444,032,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7522/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,444,224,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7523/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,444,416,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7524/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,444,608,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7525/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,444,800,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7526/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,444,992,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7527/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=1,445,184,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7528/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,445,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7529/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=1,445,568,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7530/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,445,760,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7531/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,445,952,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7532/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,446,144,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7533/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=1,446,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7534/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,446,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7535/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,446,720,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7536/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,446,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7537/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,447,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7538/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=1,447,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7539/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,447,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7540/500000] + optim/total_grad_norm=0.9146 + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,447,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7541/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=1,447,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7542/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,448,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7543/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,448,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7544/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,448,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7545/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,448,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7546/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,448,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7547/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,449,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7548/500000] + train/ActionNoiseL2Loss=0.1002 + throughput/total_tokens=1,449,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7549/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,449,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7550/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,449,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7551/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,449,792,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7552/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,449,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7553/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,450,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7554/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,450,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7555/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=1,450,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7556/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,450,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7557/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,450,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7558/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,451,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7559/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,451,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7560/500000] + optim/total_grad_norm=0.7050 + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,451,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7561/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,451,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7562/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,451,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7563/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,452,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7564/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,452,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7565/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,452,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7566/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=1,452,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7567/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=1,452,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7568/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,453,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7569/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,453,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7570/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,453,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7571/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,453,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7572/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,453,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7573/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,454,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7574/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,454,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7575/500000] + train/ActionNoiseL2Loss=0.0988 + throughput/total_tokens=1,454,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7576/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,454,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7577/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,454,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7578/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=1,454,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7579/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,455,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7580/500000] + optim/total_grad_norm=1.059 + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,455,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7581/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,455,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7582/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=1,455,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7583/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,455,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7584/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,456,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7585/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,456,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7586/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,456,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7587/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,456,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7588/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,456,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7589/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,457,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7590/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,457,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7591/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,457,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7592/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=1,457,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7593/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,457,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7594/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=1,458,048,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7595/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,458,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7596/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,458,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7597/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,458,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7598/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,458,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7599/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,459,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7600/500000] + optim/total_grad_norm=1.073 + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,459,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7601/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,459,392,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7602/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,459,584,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7603/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,459,776,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7604/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,459,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7605/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=1,460,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7606/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,460,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7607/500000] + train/ActionNoiseL2Loss=0.1144 + throughput/total_tokens=1,460,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7608/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,460,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7609/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,460,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7610/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,461,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7611/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=1,461,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7612/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,461,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7613/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,461,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7614/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,461,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7615/500000] + train/ActionNoiseL2Loss=0.0851 + throughput/total_tokens=1,462,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7616/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=1,462,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7617/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=1,462,464,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7618/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,462,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7619/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,462,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7620/500000] + optim/total_grad_norm=1.030 + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,463,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7621/500000] + train/ActionNoiseL2Loss=0.0209 + throughput/total_tokens=1,463,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7622/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,463,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7623/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,463,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7624/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,463,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7625/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,464,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7626/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,464,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7627/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,464,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7628/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,464,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7629/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=1,464,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7630/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,464,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7631/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,465,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7632/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,465,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7633/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,465,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7634/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=1,465,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7635/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=1,465,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7636/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,466,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7637/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,466,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7638/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,466,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7639/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,466,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7640/500000] + optim/total_grad_norm=1.282 + train/ActionNoiseL2Loss=0.1058 + throughput/total_tokens=1,466,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7641/500000] + train/ActionNoiseL2Loss=0.0322 + throughput/total_tokens=1,467,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7642/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,467,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7643/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,467,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7644/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,467,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7645/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,467,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7646/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,468,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7647/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,468,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7648/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,468,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7649/500000] + train/ActionNoiseL2Loss=0.0996 + throughput/total_tokens=1,468,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7650/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,468,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7651/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=1,468,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7652/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,469,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7653/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,469,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7654/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,469,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7655/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,469,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7656/500000] + train/ActionNoiseL2Loss=0.1144 + throughput/total_tokens=1,469,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7657/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,470,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7658/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,470,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7659/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,470,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7660/500000] + optim/total_grad_norm=0.8987 + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,470,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7661/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,470,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7662/500000] + train/ActionNoiseL2Loss=0.0266 + throughput/total_tokens=1,471,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7663/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,471,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7664/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=1,471,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7665/500000] + train/ActionNoiseL2Loss=0.1020 + throughput/total_tokens=1,471,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7666/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,471,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7667/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,472,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7668/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,472,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7669/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=1,472,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7670/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,472,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7671/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,472,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7672/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,473,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7673/500000] + train/ActionNoiseL2Loss=0.0918 + throughput/total_tokens=1,473,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7674/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,473,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7675/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,473,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7676/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,473,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7677/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,473,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7678/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,474,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7679/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,474,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7680/500000] + optim/total_grad_norm=0.7804 + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,474,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7681/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,474,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7682/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,474,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7683/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,475,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7684/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,475,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7685/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=1,475,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7686/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,475,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7687/500000] + train/ActionNoiseL2Loss=0.0706 + throughput/total_tokens=1,475,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7688/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,476,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7689/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,476,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7690/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=1,476,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7691/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,476,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7692/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,476,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7693/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,477,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7694/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,477,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7695/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,477,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7696/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,477,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7697/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,477,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7698/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,478,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7699/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,478,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7700/500000] + optim/total_grad_norm=1.117 + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,478,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7701/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,478,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7702/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,478,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7703/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,478,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7704/500000] + train/ActionNoiseL2Loss=0.0298 + throughput/total_tokens=1,479,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7705/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,479,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7706/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,479,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7707/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,479,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7708/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,479,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7709/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,480,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7710/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,480,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7711/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,480,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7712/500000] + train/ActionNoiseL2Loss=0.1229 + throughput/total_tokens=1,480,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7713/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,480,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7714/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,481,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7715/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,481,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7716/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,481,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7717/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,481,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7718/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,481,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7719/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,482,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7720/500000] + optim/total_grad_norm=0.6298 + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,482,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7721/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=1,482,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7722/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,482,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7723/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,482,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7724/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,483,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7725/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,483,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7726/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,483,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7727/500000] + train/ActionNoiseL2Loss=0.0887 + throughput/total_tokens=1,483,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7728/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,483,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7729/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,483,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7730/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,484,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7731/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,484,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7732/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,484,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7733/500000] + train/ActionNoiseL2Loss=0.0992 + throughput/total_tokens=1,484,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7734/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=1,484,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7735/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,485,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7736/500000] + train/ActionNoiseL2Loss=0.0300 + throughput/total_tokens=1,485,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7737/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=1,485,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7738/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=1,485,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7739/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,485,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7740/500000] + optim/total_grad_norm=0.9700 + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,486,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7741/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,486,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7742/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,486,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7743/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,486,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7744/500000] + train/ActionNoiseL2Loss=0.1218 + throughput/total_tokens=1,486,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7745/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,487,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7746/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,487,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7747/500000] + train/ActionNoiseL2Loss=0.1283 + throughput/total_tokens=1,487,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7748/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,487,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7749/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,487,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7750/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,488,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7751/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=1,488,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7752/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,488,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7753/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,488,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7754/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,488,768,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7755/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,488,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7756/500000] + train/ActionNoiseL2Loss=0.1074 + throughput/total_tokens=1,489,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7757/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,489,344,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7758/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=1,489,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7759/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,489,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7760/500000] + optim/total_grad_norm=0.6130 + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,489,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7761/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,490,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7762/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,490,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7763/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,490,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7764/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,490,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7765/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,490,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7766/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=1,491,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7767/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,491,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7768/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,491,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7769/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,491,648,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7770/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,491,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7771/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,492,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7772/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=1,492,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7773/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,492,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7774/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,492,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7775/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,492,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7776/500000] + train/ActionNoiseL2Loss=0.1210 + throughput/total_tokens=1,492,992,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7777/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,493,184,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7778/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,493,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7779/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=1,493,568,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7780/500000] + optim/total_grad_norm=0.8667 + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,493,760,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7781/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,493,952,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7782/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,494,144,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7783/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,494,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7784/500000] + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=1,494,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7785/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,494,720,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7786/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=1,494,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7787/500000] + train/ActionNoiseL2Loss=0.1602 + throughput/total_tokens=1,495,104,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7788/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=1,495,296,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7789/500000] + train/ActionNoiseL2Loss=0.1228 + throughput/total_tokens=1,495,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7790/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,495,680,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7791/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=1,495,872,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=7792/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=1,496,064,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7793/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,496,256,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7794/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=1,496,448,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7795/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,496,640,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7796/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,496,832,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7797/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,497,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7798/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,497,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7799/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=1,497,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7800/500000] + optim/total_grad_norm=1.035 + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,497,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7801/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,497,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7802/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,497,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7803/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,498,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7804/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,498,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7805/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,498,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7806/500000] + train/ActionNoiseL2Loss=0.0921 + throughput/total_tokens=1,498,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7807/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,498,944,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7808/500000] + train/ActionNoiseL2Loss=0.0279 + throughput/total_tokens=1,499,136,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7809/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=1,499,328,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=7810/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,499,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=7811/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,499,712,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7812/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,499,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7813/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,500,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7814/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=1,500,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7815/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,500,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7816/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,500,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7817/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,500,864,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7818/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,501,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7819/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=1,501,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7820/500000] + optim/total_grad_norm=0.8635 + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,501,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7821/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=1,501,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7822/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,501,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7823/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,502,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7824/500000] + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=1,502,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7825/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,502,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7826/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,502,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7827/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,502,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7828/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,502,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7829/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,503,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7830/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,503,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7831/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,503,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7832/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,503,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7833/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,503,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7834/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,504,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7835/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,504,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7836/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,504,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7837/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,504,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7838/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=1,504,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7839/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,505,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=7840/500000] + optim/total_grad_norm=0.6860 + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,505,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7841/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,505,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7842/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,505,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7843/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,505,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7844/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,506,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7845/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,506,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7846/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,506,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7847/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,506,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7848/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,506,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7849/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,507,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7850/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,507,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7851/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=1,507,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7852/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,507,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7853/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=1,507,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7854/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,507,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7855/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,508,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7856/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,508,352,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7857/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=1,508,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7858/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=1,508,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7859/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=1,508,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7860/500000] + optim/total_grad_norm=1.179 + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=1,509,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7861/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,509,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7862/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,509,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7863/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,509,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7864/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=1,509,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7865/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=1,510,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7866/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,510,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7867/500000] + train/ActionNoiseL2Loss=0.0185 + throughput/total_tokens=1,510,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7868/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,510,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7869/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,510,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7870/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,511,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7871/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,511,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7872/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,511,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7873/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,511,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7874/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,511,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7875/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,512,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7876/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,512,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7877/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=1,512,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7878/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,512,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7879/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=1,512,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7880/500000] + optim/total_grad_norm=0.5519 + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,512,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7881/500000] + train/ActionNoiseL2Loss=0.0219 + throughput/total_tokens=1,513,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7882/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,513,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7883/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,513,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7884/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,513,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7885/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=1,513,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7886/500000] + train/ActionNoiseL2Loss=0.1233 + throughput/total_tokens=1,514,112,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7887/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,514,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7888/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=1,514,496,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7889/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=1,514,688,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7890/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,514,880,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7891/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,515,072,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7892/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=1,515,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7893/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,515,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7894/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=1,515,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7895/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,515,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7896/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=1,516,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7897/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,516,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7898/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,516,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7899/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,516,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7900/500000] + optim/total_grad_norm=1.352 + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,516,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7901/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=1,516,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7902/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,517,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7903/500000] + train/ActionNoiseL2Loss=0.0990 + throughput/total_tokens=1,517,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7904/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,517,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7905/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,517,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7906/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,517,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7907/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,518,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7908/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=1,518,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7909/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=1,518,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7910/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,518,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7911/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,518,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7912/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,519,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7913/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,519,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7914/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,519,488,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7915/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,519,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7916/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,519,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7917/500000] + train/ActionNoiseL2Loss=0.1364 + throughput/total_tokens=1,520,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7918/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,520,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7919/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,520,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=7920/500000] + optim/total_grad_norm=1.001 + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,520,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=7921/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,520,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7922/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,521,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7923/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,521,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7924/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,521,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7925/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,521,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7926/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=1,521,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7927/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,521,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7928/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,522,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7929/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=1,522,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7930/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=1,522,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7931/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=1,522,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7932/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,522,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7933/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,523,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7934/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,523,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7935/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,523,520,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7936/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,523,712,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7937/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,523,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7938/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,524,096,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7939/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,524,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7940/500000] + optim/total_grad_norm=0.6436 + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,524,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7941/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,524,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7942/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,524,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7943/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,525,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7944/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,525,248,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7945/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,525,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7946/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,525,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7947/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,525,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7948/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,526,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7949/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,526,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=7950/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,526,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7951/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,526,592,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7952/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,526,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7953/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,526,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7954/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,527,168,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7955/500000] + train/ActionNoiseL2Loss=0.1087 + throughput/total_tokens=1,527,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7956/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,527,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7957/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,527,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7958/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=1,527,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7959/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,528,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7960/500000] + optim/total_grad_norm=0.8987 + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,528,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=7961/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,528,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=7962/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,528,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7963/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,528,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7964/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,529,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7965/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,529,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7966/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,529,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7967/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,529,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7968/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,529,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7969/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,530,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=7970/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,530,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7971/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=1,530,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7972/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,530,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7973/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,530,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7974/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=1,531,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7975/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,531,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7976/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,531,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7977/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=1,531,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7978/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,531,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7979/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,531,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7980/500000] + optim/total_grad_norm=0.9633 + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,532,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7981/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,532,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7982/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,532,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=7983/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,532,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7984/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=1,532,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7985/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,533,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7986/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,533,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7987/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,533,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7988/500000] + train/ActionNoiseL2Loss=0.0856 + throughput/total_tokens=1,533,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7989/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,533,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7990/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,534,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=7991/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,534,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7992/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,534,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7993/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,534,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=7994/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=1,534,848,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=7995/500000] + train/ActionNoiseL2Loss=0.0287 + throughput/total_tokens=1,535,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7996/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,535,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7997/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,535,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7998/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,535,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=7999/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,535,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8000/500000] + optim/total_grad_norm=0.8897 + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,536,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/13 [16:22:22] INFO | >> Saving config... checkpoint.py:608 +10/13 [16:22:55] INFO | >> Saving model state... checkpoint.py:796 +10/13 [16:24:07] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [16:25:37] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=8001/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,536,192,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8002/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,536,384,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8003/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,536,576,000 + throughput/device/tokens_per_second=1,128 + throughput/device/batches_per_second=0.0470 +[step=8004/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,536,768,000 + throughput/device/tokens_per_second=1,132 + throughput/device/batches_per_second=0.0472 +[step=8005/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,536,960,000 + throughput/device/tokens_per_second=1,136 + throughput/device/batches_per_second=0.0473 +[step=8006/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,537,152,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=8007/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,537,344,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=8008/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,537,536,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=8009/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=1,537,728,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=8010/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,537,920,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=8011/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,538,112,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=8012/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,538,304,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=8013/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,538,496,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8014/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,538,688,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8015/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=1,538,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8016/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,539,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8017/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=1,539,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8018/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,539,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8019/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=1,539,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8020/500000] + optim/total_grad_norm=1.452 + train/ActionNoiseL2Loss=0.1117 + throughput/total_tokens=1,539,840,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8021/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,540,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8022/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,540,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8023/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,540,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8024/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,540,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8025/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,540,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8026/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,540,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8027/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,541,184,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8028/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,541,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8029/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,541,568,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8030/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,541,760,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8031/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,541,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8032/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,542,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8033/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,542,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8034/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,542,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8035/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,542,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8036/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,542,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8037/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,543,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8038/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,543,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8039/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,543,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8040/500000] + optim/total_grad_norm=0.9251 + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,543,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8041/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,543,872,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8042/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,544,064,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8043/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,544,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8044/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=1,544,448,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8045/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,544,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8046/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=1,544,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8047/500000] + train/ActionNoiseL2Loss=0.1059 + throughput/total_tokens=1,545,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8048/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,545,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8049/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,545,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8050/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,545,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8051/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=1,545,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8052/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=1,545,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8053/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,546,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8054/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,546,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8055/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,546,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8056/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,546,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8057/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,546,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8058/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,547,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8059/500000] + train/ActionNoiseL2Loss=0.0202 + throughput/total_tokens=1,547,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8060/500000] + optim/total_grad_norm=0.9665 + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=1,547,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8061/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,547,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8062/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,547,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8063/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,548,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8064/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,548,288,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8065/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=1,548,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8066/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,548,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8067/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,548,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8068/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,549,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8069/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,549,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8070/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,549,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8071/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,549,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8072/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,549,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8073/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,550,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8074/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,550,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8075/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,550,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8076/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,550,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8077/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=1,550,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8078/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=1,550,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8079/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,551,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8080/500000] + optim/total_grad_norm=0.8557 + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,551,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8081/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,551,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8082/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=1,551,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8083/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=1,551,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8084/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=1,552,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8085/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,552,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8086/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=1,552,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8087/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,552,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8088/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,552,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8089/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=1,553,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8090/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,553,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8091/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,553,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8092/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,553,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8093/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=1,553,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8094/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,554,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8095/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,554,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8096/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,554,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8097/500000] + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=1,554,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8098/500000] + train/ActionNoiseL2Loss=0.0743 + throughput/total_tokens=1,554,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8099/500000] + train/ActionNoiseL2Loss=0.0230 + throughput/total_tokens=1,555,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8100/500000] + optim/total_grad_norm=0.7059 + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,555,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8101/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,555,392,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8102/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,555,584,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=8103/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,555,776,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=8104/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=1,555,968,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=8105/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=1,556,160,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=8106/500000] + train/ActionNoiseL2Loss=0.0286 + throughput/total_tokens=1,556,352,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=8107/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,556,544,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=8108/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,556,736,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=8109/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,556,928,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=8110/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,557,120,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 + System/Peak GPU Memory (MB)=51,076 +[step=8111/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=1,557,312,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8112/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,557,504,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8113/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,557,696,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8114/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,557,888,000 + throughput/device/tokens_per_second=1,133 + throughput/device/batches_per_second=0.0472 +[step=8115/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,558,080,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8116/500000] + train/ActionNoiseL2Loss=0.1109 + throughput/total_tokens=1,558,272,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8117/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,558,464,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8118/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=1,558,656,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8119/500000] + train/ActionNoiseL2Loss=0.0898 + throughput/total_tokens=1,558,848,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=8120/500000] + optim/total_grad_norm=0.6698 + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,559,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8121/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,559,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8122/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,559,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8123/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,559,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8124/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,559,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8125/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,560,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8126/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,560,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8127/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,560,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8128/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=1,560,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8129/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,560,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8130/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,560,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8131/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,561,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8132/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=1,561,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8133/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,561,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8134/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,561,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8135/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,561,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8136/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,562,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8137/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,562,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8138/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,562,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8139/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,562,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8140/500000] + optim/total_grad_norm=0.7530 + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,562,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8141/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,563,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8142/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,563,264,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8143/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,563,456,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8144/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,563,648,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8145/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,563,840,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8146/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=1,564,032,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8147/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,564,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8148/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,564,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8149/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=1,564,608,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8150/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,564,800,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8151/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,564,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8152/500000] + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=1,565,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8153/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,565,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8154/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,565,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8155/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,565,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8156/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=1,565,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8157/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=1,566,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8158/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,566,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8159/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,566,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8160/500000] + optim/total_grad_norm=1.707 + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=1,566,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8161/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,566,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8162/500000] + train/ActionNoiseL2Loss=0.0242 + throughput/total_tokens=1,567,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8163/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,567,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8164/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=1,567,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8165/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,567,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8166/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,567,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8167/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,568,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8168/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,568,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8169/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,568,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8170/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,568,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8171/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,568,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8172/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,569,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8173/500000] + train/ActionNoiseL2Loss=0.0832 + throughput/total_tokens=1,569,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8174/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,569,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8175/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=1,569,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8176/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,569,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8177/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,569,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8178/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,570,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8179/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,570,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8180/500000] + optim/total_grad_norm=1.127 + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,570,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8181/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,570,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8182/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,570,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8183/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,571,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8184/500000] + train/ActionNoiseL2Loss=0.1298 + throughput/total_tokens=1,571,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8185/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,571,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8186/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,571,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8187/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,571,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8188/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,572,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8189/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=1,572,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8190/500000] + train/ActionNoiseL2Loss=0.0976 + throughput/total_tokens=1,572,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8191/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,572,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8192/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=1,572,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8193/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,573,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8194/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,573,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8195/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,573,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8196/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,573,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8197/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,573,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8198/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,574,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8199/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,574,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8200/500000] + optim/total_grad_norm=0.5457 + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,574,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8201/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=1,574,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8202/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,574,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8203/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,574,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8204/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,575,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8205/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,575,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8206/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,575,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8207/500000] + train/ActionNoiseL2Loss=0.0229 + throughput/total_tokens=1,575,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8208/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,575,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8209/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,576,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8210/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,576,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=8211/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=1,576,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8212/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,576,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8213/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,576,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8214/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,577,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8215/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,577,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8216/500000] + train/ActionNoiseL2Loss=0.1010 + throughput/total_tokens=1,577,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8217/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,577,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8218/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=1,577,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8219/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,578,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8220/500000] + optim/total_grad_norm=0.4183 + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,578,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8221/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,578,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8222/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,578,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8223/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,578,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8224/500000] + train/ActionNoiseL2Loss=0.0922 + throughput/total_tokens=1,579,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8225/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,579,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8226/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,579,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8227/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,579,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8228/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,579,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8229/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,579,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8230/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,580,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8231/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,580,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8232/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,580,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8233/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,580,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8234/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,580,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8235/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,581,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8236/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,581,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8237/500000] + train/ActionNoiseL2Loss=0.1405 + throughput/total_tokens=1,581,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8238/500000] + train/ActionNoiseL2Loss=0.0884 + throughput/total_tokens=1,581,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8239/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,581,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8240/500000] + optim/total_grad_norm=0.5756 + train/ActionNoiseL2Loss=0.0312 + throughput/total_tokens=1,582,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8241/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,582,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8242/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,582,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8243/500000] + train/ActionNoiseL2Loss=0.0250 + throughput/total_tokens=1,582,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8244/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,582,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8245/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=1,583,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8246/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,583,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8247/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,583,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8248/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=1,583,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8249/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,583,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8250/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=1,584,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8251/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,584,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8252/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=1,584,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8253/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,584,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8254/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,584,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8255/500000] + train/ActionNoiseL2Loss=0.0274 + throughput/total_tokens=1,584,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8256/500000] + train/ActionNoiseL2Loss=0.0223 + throughput/total_tokens=1,585,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8257/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,585,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8258/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,585,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8259/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,585,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8260/500000] + optim/total_grad_norm=0.8597 + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,585,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8261/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,586,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8262/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,586,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8263/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,586,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8264/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,586,688,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8265/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,586,880,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8266/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,587,072,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8267/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=1,587,264,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8268/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,587,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8269/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,587,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8270/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,587,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8271/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,588,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8272/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,588,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8273/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,588,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8274/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=1,588,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8275/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,588,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8276/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,588,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8277/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,589,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8278/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,589,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8279/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,589,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8280/500000] + optim/total_grad_norm=0.5536 + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,589,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8281/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,589,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8282/500000] + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=1,590,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8283/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,590,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8284/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,590,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8285/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,590,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8286/500000] + train/ActionNoiseL2Loss=0.0295 + throughput/total_tokens=1,590,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8287/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=1,591,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8288/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,591,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8289/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,591,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8290/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=1,591,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8291/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,591,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8292/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,592,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8293/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,592,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8294/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=1,592,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8295/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=1,592,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8296/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,592,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8297/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,593,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8298/500000] + train/ActionNoiseL2Loss=0.1145 + throughput/total_tokens=1,593,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8299/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,593,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8300/500000] + optim/total_grad_norm=0.6289 + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=1,593,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8301/500000] + train/ActionNoiseL2Loss=0.0292 + throughput/total_tokens=1,593,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8302/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,593,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8303/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,594,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8304/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,594,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8305/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,594,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8306/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,594,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8307/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,594,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8308/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,595,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8309/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,595,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8310/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=1,595,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8311/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=1,595,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8312/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,595,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8313/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=1,596,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8314/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,596,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8315/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,596,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8316/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,596,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8317/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=1,596,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8318/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,597,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8319/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,597,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8320/500000] + optim/total_grad_norm=0.9744 + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=1,597,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8321/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,597,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8322/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,597,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8323/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,598,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8324/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,598,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8325/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,598,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8326/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=1,598,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8327/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,598,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8328/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,598,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8329/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,599,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8330/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,599,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8331/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,599,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8332/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,599,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8333/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,599,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8334/500000] + train/ActionNoiseL2Loss=0.0973 + throughput/total_tokens=1,600,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8335/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,600,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8336/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,600,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8337/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,600,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8338/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,600,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8339/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,601,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8340/500000] + optim/total_grad_norm=0.6366 + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,601,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8341/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,601,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8342/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=1,601,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8343/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,601,856,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8344/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,602,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8345/500000] + train/ActionNoiseL2Loss=0.1080 + throughput/total_tokens=1,602,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8346/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,602,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8347/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=1,602,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8348/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=1,602,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8349/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,603,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8350/500000] + train/ActionNoiseL2Loss=0.0232 + throughput/total_tokens=1,603,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8351/500000] + train/ActionNoiseL2Loss=0.0204 + throughput/total_tokens=1,603,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8352/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,603,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8353/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=1,603,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8354/500000] + train/ActionNoiseL2Loss=0.1197 + throughput/total_tokens=1,603,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8355/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,604,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8356/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,604,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8357/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,604,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8358/500000] + train/ActionNoiseL2Loss=0.0763 + throughput/total_tokens=1,604,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8359/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,604,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8360/500000] + optim/total_grad_norm=1.142 + train/ActionNoiseL2Loss=0.1179 + throughput/total_tokens=1,605,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8361/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,605,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8362/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,605,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8363/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,605,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8364/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=1,605,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8365/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=1,606,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8366/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,606,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8367/500000] + train/ActionNoiseL2Loss=0.0917 + throughput/total_tokens=1,606,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8368/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,606,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8369/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,606,848,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8370/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,607,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8371/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,607,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8372/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=1,607,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8373/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=1,607,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8374/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,607,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8375/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,608,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8376/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,608,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8377/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=1,608,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8378/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,608,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8379/500000] + train/ActionNoiseL2Loss=0.1279 + throughput/total_tokens=1,608,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8380/500000] + optim/total_grad_norm=1.409 + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=1,608,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8381/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,609,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8382/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,609,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8383/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,609,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8384/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,609,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8385/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=1,609,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8386/500000] + train/ActionNoiseL2Loss=0.1027 + throughput/total_tokens=1,610,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8387/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,610,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8388/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,610,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8389/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=1,610,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8390/500000] + train/ActionNoiseL2Loss=0.1478 + throughput/total_tokens=1,610,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8391/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,611,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8392/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,611,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8393/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,611,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8394/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,611,648,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8395/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,611,840,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8396/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,612,032,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8397/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,612,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8398/500000] + train/ActionNoiseL2Loss=0.0875 + throughput/total_tokens=1,612,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8399/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=1,612,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8400/500000] + optim/total_grad_norm=1.056 + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,612,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8401/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,612,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8402/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,613,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8403/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,613,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8404/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,613,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8405/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,613,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8406/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,613,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8407/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,614,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8408/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,614,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8409/500000] + train/ActionNoiseL2Loss=0.1314 + throughput/total_tokens=1,614,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8410/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=1,614,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8411/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=1,614,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8412/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=1,615,104,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8413/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,615,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8414/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,615,488,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8415/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=1,615,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8416/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,615,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8417/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,616,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8418/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,616,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8419/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,616,448,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8420/500000] + optim/total_grad_norm=0.6346 + train/ActionNoiseL2Loss=0.0303 + throughput/total_tokens=1,616,640,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8421/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,616,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8422/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=1,617,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8423/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,617,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8424/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,617,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8425/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,617,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8426/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=1,617,792,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8427/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=1,617,984,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8428/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,618,176,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8429/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,618,368,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8430/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,618,560,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8431/500000] + train/ActionNoiseL2Loss=0.1015 + throughput/total_tokens=1,618,752,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8432/500000] + train/ActionNoiseL2Loss=0.0902 + throughput/total_tokens=1,618,944,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8433/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,619,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8434/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,619,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8435/500000] + train/ActionNoiseL2Loss=0.0288 + throughput/total_tokens=1,619,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8436/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,619,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8437/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,619,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8438/500000] + train/ActionNoiseL2Loss=0.0868 + throughput/total_tokens=1,620,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8439/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,620,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8440/500000] + optim/total_grad_norm=0.8669 + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,620,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8441/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,620,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8442/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,620,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8443/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=1,621,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8444/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,621,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8445/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,621,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8446/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,621,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8447/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,621,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8448/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=1,622,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8449/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,622,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8450/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=1,622,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8451/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,622,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8452/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,622,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8453/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,622,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8454/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=1,623,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8455/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,623,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8456/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,623,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8457/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,623,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8458/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,623,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8459/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,624,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8460/500000] + optim/total_grad_norm=0.8848 + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=1,624,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8461/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=1,624,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8462/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,624,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8463/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,624,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8464/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,625,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8465/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,625,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8466/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=1,625,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8467/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,625,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8468/500000] + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,625,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8469/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,626,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8470/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,626,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8471/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,626,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8472/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,626,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8473/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=1,626,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8474/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,627,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8475/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,627,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8476/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,627,392,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8477/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,627,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8478/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,627,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8479/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=1,627,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8480/500000] + optim/total_grad_norm=0.6619 + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,628,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8481/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,628,352,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8482/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,628,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8483/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=1,628,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8484/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,628,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8485/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,629,120,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8486/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=1,629,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8487/500000] + train/ActionNoiseL2Loss=0.0838 + throughput/total_tokens=1,629,504,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8488/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=1,629,696,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8489/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=1,629,888,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8490/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,630,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8491/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=1,630,272,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8492/500000] + train/ActionNoiseL2Loss=0.0972 + throughput/total_tokens=1,630,464,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8493/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,630,656,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8494/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,630,848,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8495/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,631,040,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8496/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,631,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8497/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,631,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8498/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,631,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8499/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,631,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8500/500000] + optim/total_grad_norm=1.002 + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,632,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +10/13 [19:21:34] INFO | >> Saving config... checkpoint.py:608 +10/13 [19:22:07] INFO | >> Saving model state... checkpoint.py:796 +10/13 [19:23:16] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [19:24:50] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=8501/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,632,192,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=8502/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,632,384,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=8503/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,632,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8504/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,632,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8505/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,632,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8506/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,633,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8507/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=1,633,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8508/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,633,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8509/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,633,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8510/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=1,633,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8511/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,634,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8512/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,634,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8513/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,634,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8514/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,634,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8515/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,634,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8516/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,635,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8517/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,635,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8518/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,635,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8519/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=1,635,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8520/500000] + optim/total_grad_norm=0.8388 + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,635,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8521/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,636,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8522/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=1,636,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8523/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,636,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8524/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=1,636,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8525/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,636,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8526/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,636,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8527/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,637,184,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8528/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,637,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8529/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,637,568,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8530/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,637,760,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8531/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,637,952,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8532/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,638,144,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8533/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,638,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8534/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,638,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8535/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,638,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8536/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=1,638,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8537/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,639,104,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8538/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,639,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8539/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=1,639,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8540/500000] + optim/total_grad_norm=0.9060 + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,639,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8541/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=1,639,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8542/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,640,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8543/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=1,640,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8544/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,640,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8545/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,640,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8546/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=1,640,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8547/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,641,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8548/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,641,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8549/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=1,641,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8550/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,641,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8551/500000] + train/ActionNoiseL2Loss=0.0218 + throughput/total_tokens=1,641,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8552/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,641,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8553/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=1,642,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8554/500000] + train/ActionNoiseL2Loss=0.0964 + throughput/total_tokens=1,642,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8555/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,642,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8556/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,642,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8557/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,642,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8558/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,643,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8559/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,643,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8560/500000] + optim/total_grad_norm=0.8147 + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=1,643,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8561/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,643,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8562/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,643,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8563/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,644,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8564/500000] + train/ActionNoiseL2Loss=0.1016 + throughput/total_tokens=1,644,288,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8565/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,644,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8566/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,644,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8567/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,644,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8568/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=1,645,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8569/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,645,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8570/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,645,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8571/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,645,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8572/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,645,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8573/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=1,646,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8574/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,646,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8575/500000] + train/ActionNoiseL2Loss=0.0271 + throughput/total_tokens=1,646,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8576/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,646,592,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8577/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=1,646,784,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8578/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,646,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8579/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,647,168,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8580/500000] + optim/total_grad_norm=0.5586 + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=1,647,360,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8581/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,647,552,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8582/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,647,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8583/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,647,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8584/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,648,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8585/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,648,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8586/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,648,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8587/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,648,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8588/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,648,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8589/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,649,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8590/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,649,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8591/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,649,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8592/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=1,649,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8593/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,649,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8594/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,650,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8595/500000] + train/ActionNoiseL2Loss=0.0779 + throughput/total_tokens=1,650,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8596/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,650,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8597/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,650,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8598/500000] + train/ActionNoiseL2Loss=0.0243 + throughput/total_tokens=1,650,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8599/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,651,008,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8600/500000] + optim/total_grad_norm=1.121 + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,651,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8601/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=1,651,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8602/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=1,651,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8603/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,651,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8604/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,651,968,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8605/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,652,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8606/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=1,652,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8607/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,652,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8608/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,652,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8609/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,652,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8610/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,653,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8611/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,653,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8612/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,653,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8613/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,653,696,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8614/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,653,888,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8615/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,654,080,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8616/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,654,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8617/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,654,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8618/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=1,654,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8619/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=1,654,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8620/500000] + optim/total_grad_norm=0.8034 + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,655,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8621/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,655,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8622/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,655,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8623/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,655,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8624/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,655,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8625/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,656,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8626/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=1,656,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8627/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,656,384,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8628/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,656,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8629/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=1,656,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8630/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,656,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8631/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,657,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8632/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,657,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8633/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,657,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8634/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,657,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8635/500000] + train/ActionNoiseL2Loss=0.0947 + throughput/total_tokens=1,657,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8636/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,658,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8637/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,658,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8638/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,658,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8639/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=1,658,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8640/500000] + optim/total_grad_norm=0.6668 + train/ActionNoiseL2Loss=0.0205 + throughput/total_tokens=1,658,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8641/500000] + train/ActionNoiseL2Loss=0.0359 + throughput/total_tokens=1,659,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8642/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,659,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8643/500000] + train/ActionNoiseL2Loss=0.0262 + throughput/total_tokens=1,659,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8644/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,659,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8645/500000] + train/ActionNoiseL2Loss=0.1093 + throughput/total_tokens=1,659,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8646/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,660,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8647/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,660,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8648/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,660,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8649/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,660,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8650/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,660,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8651/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,660,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8652/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,661,184,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8653/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=1,661,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8654/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,661,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8655/500000] + train/ActionNoiseL2Loss=0.0915 + throughput/total_tokens=1,661,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8656/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,661,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8657/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,662,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8658/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,662,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8659/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,662,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8660/500000] + optim/total_grad_norm=0.8205 + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,662,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8661/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,662,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8662/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,663,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8663/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,663,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8664/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=1,663,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8665/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,663,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8666/500000] + train/ActionNoiseL2Loss=0.0199 + throughput/total_tokens=1,663,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8667/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,664,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8668/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,664,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8669/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,664,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8670/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,664,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8671/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,664,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8672/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=1,665,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8673/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=1,665,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8674/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,665,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8675/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,665,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8676/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,665,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8677/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,665,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8678/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,666,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8679/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,666,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8680/500000] + optim/total_grad_norm=0.9338 + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,666,560,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8681/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=1,666,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8682/500000] + train/ActionNoiseL2Loss=0.0288 + throughput/total_tokens=1,666,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8683/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,667,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8684/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,667,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8685/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,667,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8686/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,667,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8687/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,667,904,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8688/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=1,668,096,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8689/500000] + train/ActionNoiseL2Loss=0.0261 + throughput/total_tokens=1,668,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8690/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,668,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8691/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,668,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8692/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,668,864,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8693/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,669,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8694/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,669,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8695/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,669,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8696/500000] + train/ActionNoiseL2Loss=0.0276 + throughput/total_tokens=1,669,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8697/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,669,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8698/500000] + train/ActionNoiseL2Loss=0.1242 + throughput/total_tokens=1,670,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8699/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=1,670,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8700/500000] + optim/total_grad_norm=1.822 + train/ActionNoiseL2Loss=0.0953 + throughput/total_tokens=1,670,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8701/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,670,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8702/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,670,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8703/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,670,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8704/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,671,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8705/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=1,671,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8706/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,671,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8707/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,671,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8708/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,671,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8709/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=1,672,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8710/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,672,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8711/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,672,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8712/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,672,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8713/500000] + train/ActionNoiseL2Loss=0.0244 + throughput/total_tokens=1,672,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8714/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,673,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8715/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,673,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8716/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,673,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8717/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,673,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8718/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,673,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8719/500000] + train/ActionNoiseL2Loss=0.1081 + throughput/total_tokens=1,674,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8720/500000] + optim/total_grad_norm=0.8278 + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,674,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8721/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,674,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8722/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,674,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8723/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,674,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8724/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=1,675,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8725/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,675,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8726/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,675,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8727/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,675,584,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8728/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,675,776,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8729/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,675,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8730/500000] + train/ActionNoiseL2Loss=0.1362 + throughput/total_tokens=1,676,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8731/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,676,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8732/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,676,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8733/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,676,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8734/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,676,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8735/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,677,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8736/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,677,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8737/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,677,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8738/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,677,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8739/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,677,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8740/500000] + optim/total_grad_norm=0.8525 + train/ActionNoiseL2Loss=0.0914 + throughput/total_tokens=1,678,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8741/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,678,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8742/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,678,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8743/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,678,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8744/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,678,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8745/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,679,040,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8746/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,679,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8747/500000] + train/ActionNoiseL2Loss=0.0874 + throughput/total_tokens=1,679,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8748/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,679,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8749/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,679,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8750/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,680,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8751/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,680,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8752/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,680,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8753/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,680,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8754/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,680,768,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8755/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,680,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8756/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=1,681,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8757/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=1,681,344,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8758/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,681,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8759/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,681,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8760/500000] + optim/total_grad_norm=0.6499 + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,681,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8761/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,682,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8762/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,682,304,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8763/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,682,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8764/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,682,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8765/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,682,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8766/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,683,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8767/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,683,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8768/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,683,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8769/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,683,648,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8770/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,683,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8771/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=1,684,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8772/500000] + train/ActionNoiseL2Loss=0.0910 + throughput/total_tokens=1,684,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8773/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,684,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8774/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,684,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8775/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,684,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8776/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,684,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8777/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,685,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8778/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,685,376,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8779/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,685,568,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8780/500000] + optim/total_grad_norm=0.8313 + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,685,760,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8781/500000] + train/ActionNoiseL2Loss=0.0753 + throughput/total_tokens=1,685,952,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8782/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,686,144,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8783/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,686,336,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8784/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,686,528,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8785/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,686,720,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8786/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,686,912,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8787/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,687,104,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8788/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,687,296,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8789/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,687,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8790/500000] + train/ActionNoiseL2Loss=0.0199 + throughput/total_tokens=1,687,680,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8791/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=1,687,872,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8792/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,688,064,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8793/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,688,256,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8794/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,688,448,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8795/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,688,640,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8796/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,688,832,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8797/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,689,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8798/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,689,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8799/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,689,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8800/500000] + optim/total_grad_norm=1.096 + train/ActionNoiseL2Loss=0.1038 + throughput/total_tokens=1,689,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8801/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,689,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8802/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,689,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8803/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,690,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8804/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,690,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8805/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,690,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8806/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,690,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8807/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=1,690,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8808/500000] + train/ActionNoiseL2Loss=0.0970 + throughput/total_tokens=1,691,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8809/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,691,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8810/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,691,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8811/500000] + train/ActionNoiseL2Loss=0.1088 + throughput/total_tokens=1,691,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8812/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,691,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8813/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,692,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8814/500000] + train/ActionNoiseL2Loss=0.1229 + throughput/total_tokens=1,692,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8815/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=1,692,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8816/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,692,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8817/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,692,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8818/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,693,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8819/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=1,693,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8820/500000] + optim/total_grad_norm=0.7426 + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,693,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8821/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=1,693,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8822/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,693,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8823/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=1,694,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8824/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,694,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8825/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=1,694,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8826/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,694,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8827/500000] + train/ActionNoiseL2Loss=0.0800 + throughput/total_tokens=1,694,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8828/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,694,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8829/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,695,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8830/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=1,695,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8831/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,695,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8832/500000] + train/ActionNoiseL2Loss=0.1319 + throughput/total_tokens=1,695,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8833/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=1,695,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8834/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,696,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8835/500000] + train/ActionNoiseL2Loss=0.1000 + throughput/total_tokens=1,696,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8836/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=1,696,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8837/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,696,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8838/500000] + train/ActionNoiseL2Loss=0.1051 + throughput/total_tokens=1,696,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8839/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,697,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8840/500000] + optim/total_grad_norm=0.8819 + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=1,697,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8841/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,697,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8842/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=1,697,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8843/500000] + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=1,697,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8844/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,698,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8845/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,698,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8846/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,698,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8847/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,698,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8848/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,698,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8849/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,699,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8850/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,699,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8851/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,699,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8852/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,699,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8853/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,699,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8854/500000] + train/ActionNoiseL2Loss=0.0998 + throughput/total_tokens=1,699,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8855/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,700,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8856/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=1,700,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8857/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,700,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8858/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,700,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8859/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,700,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8860/500000] + optim/total_grad_norm=0.4312 + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,701,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8861/500000] + train/ActionNoiseL2Loss=0.1486 + throughput/total_tokens=1,701,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8862/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,701,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8863/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,701,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8864/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,701,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8865/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,702,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8866/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,702,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8867/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=1,702,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8868/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,702,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8869/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,702,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8870/500000] + train/ActionNoiseL2Loss=0.0963 + throughput/total_tokens=1,703,040,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8871/500000] + train/ActionNoiseL2Loss=0.0335 + throughput/total_tokens=1,703,232,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8872/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,703,424,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8873/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,703,616,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8874/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=1,703,808,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8875/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,704,000,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8876/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,704,192,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8877/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,704,384,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8878/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,704,576,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=8879/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,704,768,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8880/500000] + optim/total_grad_norm=0.8626 + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,704,960,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8881/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,705,152,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8882/500000] + train/ActionNoiseL2Loss=0.0226 + throughput/total_tokens=1,705,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8883/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,705,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8884/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=1,705,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8885/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,705,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8886/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,706,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8887/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=1,706,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8888/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,706,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8889/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,706,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8890/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,706,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8891/500000] + train/ActionNoiseL2Loss=0.0267 + throughput/total_tokens=1,707,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8892/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,707,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8893/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=1,707,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8894/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,707,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8895/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,707,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8896/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,708,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8897/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,708,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8898/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,708,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8899/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,708,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8900/500000] + optim/total_grad_norm=1.013 + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,708,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8901/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,708,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8902/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,709,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8903/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,709,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8904/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,709,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8905/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,709,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8906/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,709,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8907/500000] + train/ActionNoiseL2Loss=0.0977 + throughput/total_tokens=1,710,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8908/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,710,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8909/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=1,710,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8910/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,710,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8911/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,710,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8912/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,711,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8913/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,711,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8914/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,711,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8915/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,711,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8916/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,711,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8917/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,712,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8918/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,712,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8919/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,712,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=8920/500000] + optim/total_grad_norm=0.6992 + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,712,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8921/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=1,712,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8922/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,713,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8923/500000] + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,713,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8924/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,713,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8925/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,713,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8926/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=1,713,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8927/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=1,713,984,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8928/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,714,176,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=8929/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,714,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8930/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=1,714,560,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8931/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=1,714,752,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8932/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,714,944,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8933/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,715,136,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8934/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,715,328,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8935/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,715,520,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8936/500000] + train/ActionNoiseL2Loss=0.0303 + throughput/total_tokens=1,715,712,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8937/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,715,904,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8938/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,716,096,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8939/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=1,716,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8940/500000] + optim/total_grad_norm=0.5967 + train/ActionNoiseL2Loss=0.0238 + throughput/total_tokens=1,716,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=8941/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=1,716,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8942/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,716,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8943/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=1,717,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8944/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,717,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8945/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,717,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8946/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=1,717,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8947/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,717,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8948/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,718,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8949/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,718,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8950/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,718,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8951/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=1,718,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8952/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,718,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8953/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,718,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8954/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,719,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8955/500000] + train/ActionNoiseL2Loss=0.0715 + throughput/total_tokens=1,719,360,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=8956/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,719,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8957/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,719,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8958/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,719,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8959/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,720,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=8960/500000] + optim/total_grad_norm=0.7140 + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,720,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=8961/500000] + train/ActionNoiseL2Loss=0.1075 + throughput/total_tokens=1,720,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8962/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=1,720,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8963/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,720,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8964/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,721,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8965/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,721,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8966/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,721,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=8967/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,721,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8968/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,721,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8969/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,722,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=8970/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=1,722,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8971/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,722,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8972/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,722,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8973/500000] + train/ActionNoiseL2Loss=0.0909 + throughput/total_tokens=1,722,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8974/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,723,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8975/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,723,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8976/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,723,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8977/500000] + train/ActionNoiseL2Loss=0.1079 + throughput/total_tokens=1,723,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=8978/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,723,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8979/500000] + train/ActionNoiseL2Loss=0.0831 + throughput/total_tokens=1,723,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8980/500000] + optim/total_grad_norm=0.9979 + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=1,724,160,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8981/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,724,352,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8982/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,724,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8983/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=1,724,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8984/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=1,724,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8985/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,725,120,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8986/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=1,725,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8987/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,725,504,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8988/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,725,696,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8989/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,725,888,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8990/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,726,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=8991/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,726,272,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8992/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,726,464,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8993/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,726,656,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8994/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,726,848,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8995/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=1,727,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8996/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=1,727,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=8997/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=1,727,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8998/500000] + train/ActionNoiseL2Loss=0.1073 + throughput/total_tokens=1,727,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=8999/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,727,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9000/500000] + optim/total_grad_norm=0.9845 + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,728,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/13 [22:20:17] INFO | >> Saving config... checkpoint.py:608 +10/13 [22:21:11] INFO | >> Saving model state... checkpoint.py:796 +10/13 [22:22:24] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [22:23:56] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=9001/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,728,192,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0475 +[step=9002/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=1,728,384,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=9003/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=1,728,576,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=9004/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,728,768,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=9005/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,728,960,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=9006/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=1,729,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9007/500000] + train/ActionNoiseL2Loss=0.0941 + throughput/total_tokens=1,729,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9008/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,729,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9009/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=1,729,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9010/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,729,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9011/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,730,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9012/500000] + train/ActionNoiseL2Loss=0.0940 + throughput/total_tokens=1,730,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9013/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,730,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9014/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,730,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9015/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,730,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9016/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,731,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9017/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,731,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9018/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,731,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9019/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,731,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9020/500000] + optim/total_grad_norm=0.7315 + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,731,840,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9021/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,732,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9022/500000] + train/ActionNoiseL2Loss=0.0206 + throughput/total_tokens=1,732,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9023/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=1,732,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9024/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,732,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9025/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,732,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9026/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,732,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9027/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,733,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9028/500000] + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=1,733,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9029/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,733,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9030/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,733,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9031/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=1,733,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9032/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=1,734,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9033/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,734,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9034/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,734,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9035/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,734,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9036/500000] + train/ActionNoiseL2Loss=0.1415 + throughput/total_tokens=1,734,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9037/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,735,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9038/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,735,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9039/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,735,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9040/500000] + optim/total_grad_norm=0.6219 + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,735,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9041/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,735,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9042/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,736,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9043/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=1,736,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9044/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,736,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9045/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=1,736,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9046/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,736,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9047/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,737,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9048/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,737,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9049/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,737,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9050/500000] + train/ActionNoiseL2Loss=0.0840 + throughput/total_tokens=1,737,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9051/500000] + train/ActionNoiseL2Loss=0.1481 + throughput/total_tokens=1,737,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9052/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,737,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9053/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,738,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9054/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,738,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9055/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,738,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9056/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,738,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9057/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=1,738,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9058/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,739,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9059/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,739,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9060/500000] + optim/total_grad_norm=1.121 + train/ActionNoiseL2Loss=0.0230 + throughput/total_tokens=1,739,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9061/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,739,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9062/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,739,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9063/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=1,740,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9064/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=1,740,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9065/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,740,480,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9066/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=1,740,672,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9067/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=1,740,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9068/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,741,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9069/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,741,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9070/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,741,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9071/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,741,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9072/500000] + train/ActionNoiseL2Loss=0.0339 + throughput/total_tokens=1,741,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9073/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=1,742,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9074/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,742,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9075/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,742,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9076/500000] + train/ActionNoiseL2Loss=0.0191 + throughput/total_tokens=1,742,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9077/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=1,742,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9078/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,742,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9079/500000] + train/ActionNoiseL2Loss=0.0688 + throughput/total_tokens=1,743,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9080/500000] + optim/total_grad_norm=0.7047 + train/ActionNoiseL2Loss=0.0196 + throughput/total_tokens=1,743,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9081/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=1,743,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9082/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,743,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9083/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,743,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9084/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,744,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9085/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,744,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9086/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,744,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9087/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,744,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9088/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=1,744,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9089/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,745,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9090/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,745,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9091/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,745,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9092/500000] + train/ActionNoiseL2Loss=0.1078 + throughput/total_tokens=1,745,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9093/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,745,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9094/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,746,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9095/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,746,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9096/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,746,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9097/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,746,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9098/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,746,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9099/500000] + train/ActionNoiseL2Loss=0.0824 + throughput/total_tokens=1,747,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9100/500000] + optim/total_grad_norm=1.043 + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,747,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9101/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,747,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9102/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=1,747,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9103/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,747,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9104/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,747,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9105/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,748,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9106/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,748,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9107/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,748,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9108/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,748,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9109/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=1,748,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9110/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,749,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9111/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,749,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9112/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,749,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9113/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,749,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9114/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,749,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9115/500000] + train/ActionNoiseL2Loss=0.0547 + throughput/total_tokens=1,750,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9116/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,750,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9117/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,750,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9118/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,750,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9119/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,750,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9120/500000] + optim/total_grad_norm=0.7699 + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,751,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9121/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,751,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9122/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,751,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9123/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,751,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9124/500000] + train/ActionNoiseL2Loss=0.0205 + throughput/total_tokens=1,751,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9125/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,752,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9126/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,752,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9127/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,752,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9128/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,752,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9129/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,752,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9130/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,752,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9131/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,753,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9132/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,753,344,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9133/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,753,536,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9134/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,753,728,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9135/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,753,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9136/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,754,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9137/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,754,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9138/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,754,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9139/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=1,754,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9140/500000] + optim/total_grad_norm=0.8864 + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,754,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9141/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,755,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9142/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=1,755,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9143/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,755,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9144/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,755,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9145/500000] + train/ActionNoiseL2Loss=0.1180 + throughput/total_tokens=1,755,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9146/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,756,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9147/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,756,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9148/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,756,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9149/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,756,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9150/500000] + train/ActionNoiseL2Loss=0.0208 + throughput/total_tokens=1,756,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9151/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=1,756,992,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9152/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,757,184,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9153/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,757,376,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9154/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,757,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9155/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,757,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9156/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=1,757,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9157/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,758,144,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9158/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,758,336,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9159/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,758,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9160/500000] + optim/total_grad_norm=0.8307 + train/ActionNoiseL2Loss=0.0864 + throughput/total_tokens=1,758,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=9161/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,758,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9162/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,759,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9163/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,759,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9164/500000] + train/ActionNoiseL2Loss=0.0863 + throughput/total_tokens=1,759,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9165/500000] + train/ActionNoiseL2Loss=0.0203 + throughput/total_tokens=1,759,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9166/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=1,759,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9167/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,760,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9168/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=1,760,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9169/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,760,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9170/500000] + train/ActionNoiseL2Loss=0.0983 + throughput/total_tokens=1,760,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9171/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,760,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9172/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=1,761,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9173/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,761,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9174/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,761,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9175/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=1,761,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9176/500000] + train/ActionNoiseL2Loss=0.0917 + throughput/total_tokens=1,761,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9177/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,761,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9178/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=1,762,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9179/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,762,368,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9180/500000] + optim/total_grad_norm=1.010 + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,762,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9181/500000] + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=1,762,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9182/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,762,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9183/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,763,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9184/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,763,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9185/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=1,763,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9186/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,763,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9187/500000] + train/ActionNoiseL2Loss=0.1024 + throughput/total_tokens=1,763,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9188/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,764,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9189/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,764,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9190/500000] + train/ActionNoiseL2Loss=0.1033 + throughput/total_tokens=1,764,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9191/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,764,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9192/500000] + train/ActionNoiseL2Loss=0.0936 + throughput/total_tokens=1,764,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9193/500000] + train/ActionNoiseL2Loss=0.0234 + throughput/total_tokens=1,765,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9194/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=1,765,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9195/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,765,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9196/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=1,765,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9197/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,765,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9198/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=1,766,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9199/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,766,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9200/500000] + optim/total_grad_norm=0.8623 + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,766,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9201/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,766,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9202/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,766,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9203/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,766,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9204/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,767,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9205/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=1,767,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9206/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,767,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9207/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=1,767,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9208/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,767,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9209/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=1,768,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9210/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,768,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9211/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,768,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9212/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,768,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9213/500000] + train/ActionNoiseL2Loss=0.0181 + throughput/total_tokens=1,768,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9214/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,769,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9215/500000] + train/ActionNoiseL2Loss=0.0757 + throughput/total_tokens=1,769,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9216/500000] + train/ActionNoiseL2Loss=0.0890 + throughput/total_tokens=1,769,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9217/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=1,769,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9218/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=1,769,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9219/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=1,770,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9220/500000] + optim/total_grad_norm=0.7572 + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,770,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9221/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,770,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9222/500000] + train/ActionNoiseL2Loss=0.1103 + throughput/total_tokens=1,770,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9223/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,770,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9224/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,771,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9225/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=1,771,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9226/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,771,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9227/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,771,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9228/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,771,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9229/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=1,771,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9230/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,772,160,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9231/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,772,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9232/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=1,772,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9233/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,772,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9234/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,772,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9235/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,773,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9236/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,773,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9237/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,773,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9238/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,773,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9239/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,773,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9240/500000] + optim/total_grad_norm=1.111 + train/ActionNoiseL2Loss=0.0835 + throughput/total_tokens=1,774,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9241/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,774,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9242/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=1,774,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9243/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,774,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9244/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=1,774,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9245/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=1,775,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9246/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,775,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9247/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,775,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9248/500000] + train/ActionNoiseL2Loss=0.0879 + throughput/total_tokens=1,775,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9249/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,775,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9250/500000] + train/ActionNoiseL2Loss=0.1396 + throughput/total_tokens=1,776,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9251/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,776,192,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9252/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,776,384,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9253/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,776,576,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9254/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,776,768,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9255/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,776,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9256/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,777,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9257/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,777,344,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9258/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,777,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9259/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=1,777,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9260/500000] + optim/total_grad_norm=1.005 + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,777,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9261/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,778,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9262/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,778,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9263/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,778,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9264/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,778,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9265/500000] + train/ActionNoiseL2Loss=0.0886 + throughput/total_tokens=1,778,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9266/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,779,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9267/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=1,779,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9268/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,779,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9269/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,779,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9270/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,779,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9271/500000] + train/ActionNoiseL2Loss=0.1326 + throughput/total_tokens=1,780,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9272/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=1,780,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9273/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,780,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9274/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,780,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9275/500000] + train/ActionNoiseL2Loss=0.1183 + throughput/total_tokens=1,780,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9276/500000] + train/ActionNoiseL2Loss=0.0876 + throughput/total_tokens=1,780,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9277/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,781,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9278/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=1,781,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9279/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=1,781,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9280/500000] + optim/total_grad_norm=0.8172 + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,781,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9281/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,781,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9282/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,782,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9283/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,782,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9284/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,782,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9285/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,782,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9286/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,782,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9287/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,783,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9288/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,783,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9289/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,783,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9290/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,783,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9291/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,783,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9292/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,784,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9293/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,784,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9294/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,784,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9295/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=1,784,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9296/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,784,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9297/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=1,785,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9298/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=1,785,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9299/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,785,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9300/500000] + optim/total_grad_norm=0.7337 + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,785,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9301/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=1,785,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9302/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,785,984,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9303/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,786,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9304/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=1,786,368,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9305/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,786,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9306/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,786,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9307/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,786,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9308/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,787,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9309/500000] + train/ActionNoiseL2Loss=0.0283 + throughput/total_tokens=1,787,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9310/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=1,787,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9311/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,787,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9312/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,787,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9313/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,788,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9314/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,788,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9315/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=1,788,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9316/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,788,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9317/500000] + train/ActionNoiseL2Loss=0.0946 + throughput/total_tokens=1,788,864,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9318/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,789,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9319/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,789,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9320/500000] + optim/total_grad_norm=0.6581 + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,789,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9321/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,789,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9322/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,789,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9323/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,790,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9324/500000] + train/ActionNoiseL2Loss=0.0849 + throughput/total_tokens=1,790,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9325/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=1,790,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9326/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,790,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9327/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=1,790,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9328/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,790,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9329/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,791,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9330/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,791,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9331/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,791,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9332/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,791,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9333/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=1,791,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9334/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,792,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9335/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,792,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9336/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=1,792,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9337/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,792,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9338/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,792,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9339/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,793,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9340/500000] + optim/total_grad_norm=1.495 + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=1,793,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9341/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=1,793,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9342/500000] + train/ActionNoiseL2Loss=0.0798 + throughput/total_tokens=1,793,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9343/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,793,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9344/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,794,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9345/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,794,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9346/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,794,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9347/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,794,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9348/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,794,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9349/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=1,795,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9350/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=1,795,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9351/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,795,392,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9352/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,795,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9353/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,795,776,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9354/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,795,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9355/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,796,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9356/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,796,352,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9357/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=1,796,544,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9358/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,796,736,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9359/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,796,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9360/500000] + optim/total_grad_norm=1.051 + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,797,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=9361/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=1,797,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9362/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,797,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9363/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=1,797,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9364/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,797,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9365/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,798,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9366/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,798,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9367/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,798,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9368/500000] + train/ActionNoiseL2Loss=0.1065 + throughput/total_tokens=1,798,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9369/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,798,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9370/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,799,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9371/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,799,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9372/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=1,799,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9373/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,799,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9374/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=1,799,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9375/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=1,800,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9376/500000] + train/ActionNoiseL2Loss=0.0871 + throughput/total_tokens=1,800,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9377/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,800,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9378/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,800,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9379/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,800,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9380/500000] + optim/total_grad_norm=0.8290 + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=1,800,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9381/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,801,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9382/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,801,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9383/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=1,801,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9384/500000] + train/ActionNoiseL2Loss=0.0867 + throughput/total_tokens=1,801,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9385/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,801,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9386/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,802,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9387/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,802,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9388/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,802,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9389/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,802,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9390/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,802,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9391/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=1,803,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9392/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,803,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9393/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=1,803,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9394/500000] + train/ActionNoiseL2Loss=0.0532 + throughput/total_tokens=1,803,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9395/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,803,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9396/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,804,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9397/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,804,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9398/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,804,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9399/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,804,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9400/500000] + optim/total_grad_norm=0.8054 + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,804,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9401/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,804,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9402/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,805,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9403/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,805,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9404/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,805,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9405/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=1,805,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9406/500000] + train/ActionNoiseL2Loss=0.1060 + throughput/total_tokens=1,805,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9407/500000] + train/ActionNoiseL2Loss=0.0303 + throughput/total_tokens=1,806,144,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9408/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,806,336,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9409/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,806,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9410/500000] + train/ActionNoiseL2Loss=0.0814 + throughput/total_tokens=1,806,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=9411/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,806,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9412/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,807,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9413/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,807,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9414/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=1,807,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9415/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,807,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9416/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,807,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9417/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,808,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9418/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,808,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9419/500000] + train/ActionNoiseL2Loss=0.0293 + throughput/total_tokens=1,808,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9420/500000] + optim/total_grad_norm=0.8204 + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,808,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9421/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,808,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9422/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,809,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9423/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=1,809,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9424/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,809,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9425/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,809,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9426/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=1,809,792,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9427/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,809,984,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9428/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=1,810,176,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9429/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=1,810,368,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9430/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=1,810,560,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9431/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,810,752,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9432/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=1,810,944,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9433/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=1,811,136,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9434/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=1,811,328,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9435/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,811,520,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=9436/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,811,712,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9437/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,811,904,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9438/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,812,096,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9439/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,812,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9440/500000] + optim/total_grad_norm=0.8513 + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=1,812,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9441/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,812,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9442/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=1,812,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9443/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,813,056,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9444/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,813,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9445/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=1,813,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9446/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=1,813,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9447/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,813,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9448/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,814,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9449/500000] + train/ActionNoiseL2Loss=0.1152 + throughput/total_tokens=1,814,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9450/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=1,814,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9451/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,814,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9452/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,814,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9453/500000] + train/ActionNoiseL2Loss=0.0692 + throughput/total_tokens=1,814,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9454/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,815,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9455/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,815,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9456/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,815,552,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9457/500000] + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,815,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9458/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,815,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9459/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,816,128,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9460/500000] + optim/total_grad_norm=0.7107 + train/ActionNoiseL2Loss=0.0865 + throughput/total_tokens=1,816,320,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9461/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=1,816,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9462/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,816,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9463/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=1,816,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9464/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,817,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9465/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,817,280,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9466/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,817,472,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9467/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,817,664,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9468/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,817,856,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9469/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,818,048,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9470/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=1,818,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9471/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,818,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9472/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,818,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9473/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,818,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9474/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,819,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9475/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=1,819,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9476/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=1,819,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9477/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,819,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9478/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=1,819,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9479/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,819,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9480/500000] + optim/total_grad_norm=0.6719 + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=1,820,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9481/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,820,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9482/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,820,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9483/500000] + train/ActionNoiseL2Loss=0.0984 + throughput/total_tokens=1,820,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9484/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,820,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9485/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,821,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9486/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,821,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9487/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,821,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9488/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,821,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9489/500000] + train/ActionNoiseL2Loss=0.0919 + throughput/total_tokens=1,821,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9490/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,822,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9491/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,822,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9492/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,822,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9493/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,822,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9494/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,822,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9495/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,823,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9496/500000] + train/ActionNoiseL2Loss=0.1070 + throughput/total_tokens=1,823,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9497/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,823,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9498/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,823,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9499/500000] + train/ActionNoiseL2Loss=0.1168 + throughput/total_tokens=1,823,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9500/500000] + optim/total_grad_norm=0.7347 + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,824,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/14 [01:19:32] INFO | >> Saving config... checkpoint.py:608 +10/14 [01:20:14] INFO | >> Saving model state... checkpoint.py:796 +10/14 [01:21:28] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [01:23:01] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=9501/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,824,192,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=9502/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,824,384,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9503/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=1,824,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9504/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=1,824,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9505/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=1,824,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9506/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=1,825,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9507/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,825,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9508/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,825,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9509/500000] + train/ActionNoiseL2Loss=0.1069 + throughput/total_tokens=1,825,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9510/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,825,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9511/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=1,826,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9512/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,826,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9513/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,826,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9514/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,826,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9515/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,826,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9516/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,827,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9517/500000] + train/ActionNoiseL2Loss=0.0880 + throughput/total_tokens=1,827,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9518/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,827,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9519/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,827,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9520/500000] + optim/total_grad_norm=0.5590 + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,827,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9521/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,828,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9522/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,828,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9523/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=1,828,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9524/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,828,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9525/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=1,828,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9526/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,828,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9527/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,829,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9528/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,829,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9529/500000] + train/ActionNoiseL2Loss=0.1330 + throughput/total_tokens=1,829,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9530/500000] + train/ActionNoiseL2Loss=0.0772 + throughput/total_tokens=1,829,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9531/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,829,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9532/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=1,830,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9533/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=1,830,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9534/500000] + train/ActionNoiseL2Loss=0.0993 + throughput/total_tokens=1,830,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9535/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,830,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9536/500000] + train/ActionNoiseL2Loss=0.0809 + throughput/total_tokens=1,830,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9537/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=1,831,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9538/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=1,831,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9539/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=1,831,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9540/500000] + optim/total_grad_norm=0.7656 + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=1,831,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9541/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,831,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9542/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,832,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9543/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,832,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9544/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=1,832,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9545/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=1,832,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9546/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,832,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9547/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,833,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9548/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=1,833,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9549/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,833,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9550/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,833,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9551/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,833,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9552/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,833,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9553/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,834,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9554/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,834,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9555/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=1,834,560,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9556/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=1,834,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9557/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,834,944,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9558/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,835,136,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9559/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=1,835,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9560/500000] + optim/total_grad_norm=0.9644 + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,835,520,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=9561/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,835,712,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9562/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,835,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9563/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,836,096,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9564/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,836,288,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9565/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,836,480,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9566/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,836,672,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9567/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,836,864,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9568/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,837,056,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9569/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,837,248,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9570/500000] + train/ActionNoiseL2Loss=0.0325 + throughput/total_tokens=1,837,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9571/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,837,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9572/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,837,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9573/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,838,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9574/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,838,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9575/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,838,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9576/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,838,592,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9577/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,838,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9578/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,838,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9579/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,839,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9580/500000] + optim/total_grad_norm=0.9828 + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,839,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9581/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=1,839,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9582/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,839,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9583/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,839,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9584/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=1,840,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9585/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,840,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9586/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,840,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9587/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,840,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9588/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,840,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9589/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,841,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9590/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,841,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9591/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=1,841,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9592/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,841,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9593/500000] + train/ActionNoiseL2Loss=0.1022 + throughput/total_tokens=1,841,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9594/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,842,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9595/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=1,842,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9596/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,842,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9597/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=1,842,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9598/500000] + train/ActionNoiseL2Loss=0.0328 + throughput/total_tokens=1,842,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9599/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=1,843,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9600/500000] + optim/total_grad_norm=0.9818 + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=1,843,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9601/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,843,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9602/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=1,843,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9603/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=1,843,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9604/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,843,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9605/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,844,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9606/500000] + train/ActionNoiseL2Loss=0.0760 + throughput/total_tokens=1,844,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9607/500000] + train/ActionNoiseL2Loss=0.0949 + throughput/total_tokens=1,844,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9608/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,844,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9609/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=1,844,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9610/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=1,845,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9611/500000] + train/ActionNoiseL2Loss=0.1072 + throughput/total_tokens=1,845,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9612/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,845,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9613/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,845,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9614/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=1,845,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9615/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=1,846,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9616/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=1,846,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9617/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,846,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9618/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,846,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9619/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,846,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9620/500000] + optim/total_grad_norm=1.017 + train/ActionNoiseL2Loss=0.0286 + throughput/total_tokens=1,847,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9621/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=1,847,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9622/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,847,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9623/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,847,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9624/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,847,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9625/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=1,848,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9626/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,848,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9627/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,848,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9628/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,848,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9629/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,848,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9630/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,848,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9631/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,849,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9632/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,849,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9633/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,849,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9634/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,849,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9635/500000] + train/ActionNoiseL2Loss=0.0249 + throughput/total_tokens=1,849,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9636/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=1,850,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9637/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,850,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9638/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=1,850,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9639/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=1,850,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9640/500000] + optim/total_grad_norm=1.391 + train/ActionNoiseL2Loss=0.0937 + throughput/total_tokens=1,850,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9641/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,851,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9642/500000] + train/ActionNoiseL2Loss=0.0901 + throughput/total_tokens=1,851,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9643/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,851,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9644/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,851,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9645/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,851,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9646/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,852,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9647/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,852,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9648/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=1,852,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9649/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,852,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9650/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,852,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9651/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=1,852,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9652/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=1,853,184,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9653/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,853,376,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9654/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,853,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9655/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=1,853,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9656/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,853,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9657/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,854,144,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9658/500000] + train/ActionNoiseL2Loss=0.1082 + throughput/total_tokens=1,854,336,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9659/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,854,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9660/500000] + optim/total_grad_norm=0.8225 + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=1,854,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=9661/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,854,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9662/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,855,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9663/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,855,296,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9664/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,855,488,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9665/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,855,680,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9666/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,855,872,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9667/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=1,856,064,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9668/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,856,256,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9669/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=1,856,448,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9670/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=1,856,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9671/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=1,856,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9672/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,857,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9673/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,857,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9674/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,857,408,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9675/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,857,600,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9676/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,857,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9677/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,857,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9678/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,858,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9679/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=1,858,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9680/500000] + optim/total_grad_norm=0.7566 + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,858,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9681/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=1,858,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9682/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=1,858,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9683/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=1,859,136,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9684/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,859,328,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9685/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,859,520,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9686/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,859,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9687/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,859,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9688/500000] + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=1,860,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9689/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,860,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9690/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,860,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9691/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,860,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9692/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=1,860,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9693/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,861,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9694/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,861,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9695/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,861,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9696/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=1,861,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9697/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=1,861,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9698/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=1,862,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9699/500000] + train/ActionNoiseL2Loss=0.0228 + throughput/total_tokens=1,862,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9700/500000] + optim/total_grad_norm=2.348 + train/ActionNoiseL2Loss=0.1306 + throughput/total_tokens=1,862,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9701/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=1,862,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9702/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,862,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9703/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,862,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9704/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,863,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9705/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,863,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9706/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,863,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9707/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,863,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9708/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,863,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9709/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,864,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9710/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,864,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9711/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,864,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9712/500000] + train/ActionNoiseL2Loss=0.0999 + throughput/total_tokens=1,864,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9713/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,864,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9714/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,865,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9715/500000] + train/ActionNoiseL2Loss=0.0836 + throughput/total_tokens=1,865,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9716/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,865,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9717/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=1,865,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9718/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,865,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9719/500000] + train/ActionNoiseL2Loss=0.0933 + throughput/total_tokens=1,866,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9720/500000] + optim/total_grad_norm=0.6119 + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=1,866,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9721/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=1,866,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9722/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,866,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9723/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,866,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9724/500000] + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,867,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9725/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,867,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9726/500000] + train/ActionNoiseL2Loss=0.0157 + throughput/total_tokens=1,867,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9727/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=1,867,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9728/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=1,867,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9729/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,867,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9730/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=1,868,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9731/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=1,868,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9732/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,868,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9733/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,868,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9734/500000] + train/ActionNoiseL2Loss=0.0903 + throughput/total_tokens=1,868,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9735/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=1,869,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9736/500000] + train/ActionNoiseL2Loss=0.0870 + throughput/total_tokens=1,869,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9737/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=1,869,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9738/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,869,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9739/500000] + train/ActionNoiseL2Loss=0.0260 + throughput/total_tokens=1,869,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9740/500000] + optim/total_grad_norm=0.6059 + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,870,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9741/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=1,870,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9742/500000] + train/ActionNoiseL2Loss=0.0889 + throughput/total_tokens=1,870,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9743/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,870,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9744/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=1,870,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9745/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=1,871,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9746/500000] + train/ActionNoiseL2Loss=0.0927 + throughput/total_tokens=1,871,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9747/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=1,871,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9748/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=1,871,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9749/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=1,871,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9750/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=1,872,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9751/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=1,872,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9752/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=1,872,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9753/500000] + train/ActionNoiseL2Loss=0.1132 + throughput/total_tokens=1,872,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9754/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,872,768,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9755/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,872,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9756/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,873,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9757/500000] + train/ActionNoiseL2Loss=0.0313 + throughput/total_tokens=1,873,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9758/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=1,873,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9759/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,873,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9760/500000] + optim/total_grad_norm=1.066 + train/ActionNoiseL2Loss=0.0776 + throughput/total_tokens=1,873,920,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9761/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=1,874,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9762/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=1,874,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9763/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,874,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9764/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,874,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9765/500000] + train/ActionNoiseL2Loss=0.1087 + throughput/total_tokens=1,874,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9766/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,875,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9767/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=1,875,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9768/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=1,875,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9769/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,875,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9770/500000] + train/ActionNoiseL2Loss=0.0241 + throughput/total_tokens=1,875,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9771/500000] + train/ActionNoiseL2Loss=0.0255 + throughput/total_tokens=1,876,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9772/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,876,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9773/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,876,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9774/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,876,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9775/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,876,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9776/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,876,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9777/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,877,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9778/500000] + train/ActionNoiseL2Loss=0.0314 + throughput/total_tokens=1,877,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9779/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,877,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9780/500000] + optim/total_grad_norm=0.4980 + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,877,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9781/500000] + train/ActionNoiseL2Loss=0.0285 + throughput/total_tokens=1,877,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9782/500000] + train/ActionNoiseL2Loss=0.1289 + throughput/total_tokens=1,878,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9783/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,878,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9784/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,878,528,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9785/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,878,720,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9786/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,878,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9787/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,879,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9788/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=1,879,296,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9789/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,879,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9790/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=1,879,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9791/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,879,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9792/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,880,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9793/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,880,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9794/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,880,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9795/500000] + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=1,880,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9796/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,880,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9797/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,881,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9798/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,881,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9799/500000] + train/ActionNoiseL2Loss=0.0749 + throughput/total_tokens=1,881,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9800/500000] + optim/total_grad_norm=0.4517 + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,881,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9801/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=1,881,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9802/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=1,881,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9803/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,882,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9804/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,882,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9805/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,882,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9806/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=1,882,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9807/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,882,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9808/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=1,883,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9809/500000] + train/ActionNoiseL2Loss=0.0248 + throughput/total_tokens=1,883,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9810/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,883,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9811/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,883,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9812/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,883,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9813/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=1,884,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9814/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=1,884,288,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9815/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,884,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9816/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,884,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9817/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,884,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9818/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=1,885,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9819/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,885,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9820/500000] + optim/total_grad_norm=0.5911 + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,885,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9821/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=1,885,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=9822/500000] + train/ActionNoiseL2Loss=0.1428 + throughput/total_tokens=1,885,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9823/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,886,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=9824/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,886,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9825/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=1,886,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9826/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=1,886,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9827/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,886,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9828/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=1,886,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9829/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,887,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9830/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=1,887,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9831/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=1,887,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9832/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,887,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9833/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,887,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9834/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=1,888,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9835/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,888,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9836/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,888,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9837/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,888,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9838/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,888,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9839/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,889,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9840/500000] + optim/total_grad_norm=0.7380 + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=1,889,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9841/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=1,889,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9842/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=1,889,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9843/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,889,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9844/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,890,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9845/500000] + train/ActionNoiseL2Loss=0.0275 + throughput/total_tokens=1,890,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9846/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,890,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9847/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,890,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9848/500000] + train/ActionNoiseL2Loss=0.0295 + throughput/total_tokens=1,890,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9849/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=1,891,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9850/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,891,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9851/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=1,891,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9852/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=1,891,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9853/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,891,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9854/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,891,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9855/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,892,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9856/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=1,892,352,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9857/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,892,544,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9858/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=1,892,736,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9859/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=1,892,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9860/500000] + optim/total_grad_norm=0.5541 + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,893,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=9861/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,893,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9862/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,893,504,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9863/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,893,696,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9864/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=1,893,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9865/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=1,894,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9866/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,894,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9867/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,894,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9868/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=1,894,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9869/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,894,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9870/500000] + train/ActionNoiseL2Loss=0.0245 + throughput/total_tokens=1,895,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9871/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,895,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9872/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,895,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9873/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=1,895,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9874/500000] + train/ActionNoiseL2Loss=0.0206 + throughput/total_tokens=1,895,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9875/500000] + train/ActionNoiseL2Loss=0.1221 + throughput/total_tokens=1,896,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9876/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=1,896,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9877/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,896,384,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9878/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,896,576,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9879/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,896,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9880/500000] + optim/total_grad_norm=0.7241 + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,896,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9881/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=1,897,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9882/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,897,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9883/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,897,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9884/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,897,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9885/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,897,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9886/500000] + train/ActionNoiseL2Loss=0.0233 + throughput/total_tokens=1,898,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9887/500000] + train/ActionNoiseL2Loss=0.0277 + throughput/total_tokens=1,898,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9888/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,898,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9889/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,898,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9890/500000] + train/ActionNoiseL2Loss=0.0725 + throughput/total_tokens=1,898,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9891/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,899,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9892/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=1,899,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9893/500000] + train/ActionNoiseL2Loss=0.0657 + throughput/total_tokens=1,899,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9894/500000] + train/ActionNoiseL2Loss=0.0822 + throughput/total_tokens=1,899,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9895/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,899,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9896/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=1,900,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9897/500000] + train/ActionNoiseL2Loss=0.0316 + throughput/total_tokens=1,900,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9898/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,900,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9899/500000] + train/ActionNoiseL2Loss=0.0298 + throughput/total_tokens=1,900,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9900/500000] + optim/total_grad_norm=0.7991 + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,900,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=9901/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,900,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9902/500000] + train/ActionNoiseL2Loss=0.0234 + throughput/total_tokens=1,901,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9903/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,901,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9904/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,901,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9905/500000] + train/ActionNoiseL2Loss=0.0165 + throughput/total_tokens=1,901,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9906/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,901,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9907/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=1,902,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9908/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=1,902,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9909/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,902,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=9910/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,902,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9911/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,902,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9912/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,903,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9913/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,903,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9914/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=1,903,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9915/500000] + train/ActionNoiseL2Loss=0.0385 + throughput/total_tokens=1,903,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9916/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,903,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9917/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,904,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9918/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,904,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9919/500000] + train/ActionNoiseL2Loss=0.0894 + throughput/total_tokens=1,904,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=9920/500000] + optim/total_grad_norm=0.4870 + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,904,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9921/500000] + train/ActionNoiseL2Loss=0.0392 + throughput/total_tokens=1,904,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9922/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=1,905,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9923/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=1,905,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9924/500000] + train/ActionNoiseL2Loss=0.0315 + throughput/total_tokens=1,905,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9925/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,905,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9926/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,905,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9927/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,905,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9928/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,906,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9929/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=1,906,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9930/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=1,906,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9931/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,906,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9932/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,906,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9933/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=1,907,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9934/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=1,907,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9935/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,907,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9936/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=1,907,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9937/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,907,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9938/500000] + train/ActionNoiseL2Loss=0.0200 + throughput/total_tokens=1,908,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9939/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=1,908,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9940/500000] + optim/total_grad_norm=1.327 + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=1,908,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9941/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,908,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9942/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=1,908,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9943/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=1,909,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9944/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,909,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=9945/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,909,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9946/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=1,909,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9947/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=1,909,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9948/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=1,910,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9949/500000] + train/ActionNoiseL2Loss=0.0674 + throughput/total_tokens=1,910,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9950/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=1,910,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9951/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,910,592,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9952/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=1,910,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9953/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=1,910,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9954/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,911,168,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9955/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,911,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9956/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,911,552,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9957/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,911,744,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9958/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=1,911,936,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9959/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,912,128,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9960/500000] + optim/total_grad_norm=0.7734 + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=1,912,320,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=9961/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=1,912,512,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9962/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=1,912,704,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9963/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=1,912,896,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9964/500000] + train/ActionNoiseL2Loss=0.1054 + throughput/total_tokens=1,913,088,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=9965/500000] + train/ActionNoiseL2Loss=0.0860 + throughput/total_tokens=1,913,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9966/500000] + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=1,913,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9967/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=1,913,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9968/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=1,913,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9969/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=1,914,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=9970/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,914,240,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=9971/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,914,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9972/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,914,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9973/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,914,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=9974/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=1,915,008,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9975/500000] + train/ActionNoiseL2Loss=0.1388 + throughput/total_tokens=1,915,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9976/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=1,915,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9977/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=1,915,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9978/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=1,915,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9979/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=1,915,968,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9980/500000] + optim/total_grad_norm=0.8517 + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=1,916,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9981/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=1,916,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9982/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=1,916,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9983/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,916,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9984/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=1,916,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9985/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=1,917,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9986/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,917,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9987/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,917,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9988/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=1,917,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9989/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=1,917,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9990/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=1,918,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=9991/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=1,918,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9992/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=1,918,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9993/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,918,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9994/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,918,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9995/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,919,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9996/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=1,919,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9997/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=1,919,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=9998/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=1,919,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=9999/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,919,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10000/500000] + optim/total_grad_norm=0.7299 + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,920,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/14 [04:18:33] INFO | >> Saving config... checkpoint.py:608 +10/14 [04:19:21] INFO | >> Saving model state... checkpoint.py:796 +10/14 [04:20:35] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [04:22:09] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=10001/500000] + train/ActionNoiseL2Loss=0.0260 + throughput/total_tokens=1,920,192,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=10002/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=1,920,384,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=10003/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=1,920,576,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=10004/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=1,920,768,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=10005/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=1,920,960,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10006/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,921,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10007/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,921,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10008/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,921,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10009/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,921,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10010/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,921,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10011/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=1,922,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10012/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,922,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10013/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,922,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10014/500000] + train/ActionNoiseL2Loss=0.0785 + throughput/total_tokens=1,922,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10015/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,922,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10016/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,923,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10017/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=1,923,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10018/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=1,923,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10019/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,923,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10020/500000] + optim/total_grad_norm=0.9547 + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,923,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10021/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=1,924,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10022/500000] + train/ActionNoiseL2Loss=0.0389 + throughput/total_tokens=1,924,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10023/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,924,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10024/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=1,924,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10025/500000] + train/ActionNoiseL2Loss=0.0281 + throughput/total_tokens=1,924,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10026/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=1,924,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10027/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,925,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10028/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=1,925,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10029/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=1,925,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10030/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=1,925,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10031/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=1,925,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10032/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,926,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10033/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=1,926,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10034/500000] + train/ActionNoiseL2Loss=0.0807 + throughput/total_tokens=1,926,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10035/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,926,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10036/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=1,926,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10037/500000] + train/ActionNoiseL2Loss=0.0847 + throughput/total_tokens=1,927,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10038/500000] + train/ActionNoiseL2Loss=0.0720 + throughput/total_tokens=1,927,296,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10039/500000] + train/ActionNoiseL2Loss=0.0778 + throughput/total_tokens=1,927,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10040/500000] + optim/total_grad_norm=0.8239 + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,927,680,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10041/500000] + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=1,927,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10042/500000] + train/ActionNoiseL2Loss=0.1208 + throughput/total_tokens=1,928,064,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10043/500000] + train/ActionNoiseL2Loss=0.0295 + throughput/total_tokens=1,928,256,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10044/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=1,928,448,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10045/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,928,640,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10046/500000] + train/ActionNoiseL2Loss=0.0908 + throughput/total_tokens=1,928,832,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10047/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=1,929,024,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10048/500000] + train/ActionNoiseL2Loss=0.0859 + throughput/total_tokens=1,929,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10049/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,929,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10050/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,929,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10051/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,929,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10052/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=1,929,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10053/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=1,930,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10054/500000] + train/ActionNoiseL2Loss=0.0252 + throughput/total_tokens=1,930,368,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10055/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,930,560,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10056/500000] + train/ActionNoiseL2Loss=0.0257 + throughput/total_tokens=1,930,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10057/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=1,930,944,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10058/500000] + train/ActionNoiseL2Loss=0.0230 + throughput/total_tokens=1,931,136,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10059/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=1,931,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10060/500000] + optim/total_grad_norm=0.6822 + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=1,931,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=10061/500000] + train/ActionNoiseL2Loss=0.1821 + throughput/total_tokens=1,931,712,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10062/500000] + train/ActionNoiseL2Loss=0.0271 + throughput/total_tokens=1,931,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10063/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=1,932,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10064/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=1,932,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10065/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=1,932,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10066/500000] + train/ActionNoiseL2Loss=0.0869 + throughput/total_tokens=1,932,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10067/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=1,932,864,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10068/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,933,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10069/500000] + train/ActionNoiseL2Loss=0.1403 + throughput/total_tokens=1,933,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10070/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,933,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10071/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=1,933,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10072/500000] + train/ActionNoiseL2Loss=0.0588 + throughput/total_tokens=1,933,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10073/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,934,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10074/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=1,934,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10075/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=1,934,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10076/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,934,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10077/500000] + train/ActionNoiseL2Loss=0.0254 + throughput/total_tokens=1,934,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10078/500000] + train/ActionNoiseL2Loss=0.1036 + throughput/total_tokens=1,934,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10079/500000] + train/ActionNoiseL2Loss=0.0857 + throughput/total_tokens=1,935,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10080/500000] + optim/total_grad_norm=1.216 + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=1,935,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10081/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,935,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10082/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=1,935,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10083/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=1,935,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10084/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,936,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10085/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=1,936,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10086/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=1,936,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10087/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=1,936,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10088/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,936,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10089/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=1,937,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10090/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,937,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10091/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=1,937,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10092/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,937,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10093/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=1,937,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10094/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=1,938,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10095/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=1,938,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10096/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=1,938,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10097/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=1,938,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10098/500000] + train/ActionNoiseL2Loss=0.0225 + throughput/total_tokens=1,938,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10099/500000] + train/ActionNoiseL2Loss=0.0700 + throughput/total_tokens=1,939,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10100/500000] + optim/total_grad_norm=0.6024 + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=1,939,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10101/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=1,939,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10102/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=1,939,584,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10103/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=1,939,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10104/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=1,939,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10105/500000] + train/ActionNoiseL2Loss=0.0254 + throughput/total_tokens=1,940,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10106/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,940,352,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10107/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,940,544,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10108/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,940,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10109/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=1,940,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10110/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=1,941,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10111/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=1,941,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10112/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,941,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10113/500000] + train/ActionNoiseL2Loss=0.0755 + throughput/total_tokens=1,941,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10114/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,941,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10115/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,942,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10116/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=1,942,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10117/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=1,942,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10118/500000] + train/ActionNoiseL2Loss=0.0252 + throughput/total_tokens=1,942,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10119/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,942,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10120/500000] + optim/total_grad_norm=1.168 + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=1,943,040,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10121/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=1,943,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10122/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=1,943,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10123/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=1,943,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10124/500000] + train/ActionNoiseL2Loss=0.0957 + throughput/total_tokens=1,943,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10125/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=1,944,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10126/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=1,944,192,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10127/500000] + train/ActionNoiseL2Loss=0.0190 + throughput/total_tokens=1,944,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10128/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=1,944,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10129/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=1,944,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10130/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,944,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10131/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=1,945,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10132/500000] + train/ActionNoiseL2Loss=0.0603 + throughput/total_tokens=1,945,344,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10133/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,945,536,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10134/500000] + train/ActionNoiseL2Loss=0.0912 + throughput/total_tokens=1,945,728,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10135/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=1,945,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10136/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=1,946,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10137/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=1,946,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10138/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=1,946,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10139/500000] + train/ActionNoiseL2Loss=0.1012 + throughput/total_tokens=1,946,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10140/500000] + optim/total_grad_norm=1.001 + train/ActionNoiseL2Loss=0.0638 + throughput/total_tokens=1,946,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10141/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,947,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10142/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=1,947,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10143/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,947,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10144/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=1,947,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10145/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,947,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10146/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,948,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10147/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=1,948,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10148/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,948,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10149/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,948,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10150/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=1,948,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10151/500000] + train/ActionNoiseL2Loss=0.0240 + throughput/total_tokens=1,948,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10152/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=1,949,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10153/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,949,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10154/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,949,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10155/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,949,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10156/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=1,949,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10157/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,950,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10158/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=1,950,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10159/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=1,950,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10160/500000] + optim/total_grad_norm=0.6715 + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=1,950,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10161/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=1,950,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10162/500000] + train/ActionNoiseL2Loss=0.1236 + throughput/total_tokens=1,951,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10163/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=1,951,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10164/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,951,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10165/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=1,951,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10166/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=1,951,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10167/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=1,952,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10168/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=1,952,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10169/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=1,952,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10170/500000] + train/ActionNoiseL2Loss=0.0813 + throughput/total_tokens=1,952,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10171/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,952,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10172/500000] + train/ActionNoiseL2Loss=0.0930 + throughput/total_tokens=1,953,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10173/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,953,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10174/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=1,953,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10175/500000] + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=1,953,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10176/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=1,953,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10177/500000] + train/ActionNoiseL2Loss=0.1269 + throughput/total_tokens=1,953,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10178/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=1,954,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10179/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,954,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10180/500000] + optim/total_grad_norm=1.019 + train/ActionNoiseL2Loss=0.0397 + throughput/total_tokens=1,954,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10181/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=1,954,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10182/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=1,954,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10183/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=1,955,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10184/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=1,955,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10185/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=1,955,520,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10186/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=1,955,712,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10187/500000] + train/ActionNoiseL2Loss=0.1039 + throughput/total_tokens=1,955,904,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10188/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=1,956,096,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10189/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=1,956,288,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10190/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=1,956,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10191/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=1,956,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10192/500000] + train/ActionNoiseL2Loss=0.0905 + throughput/total_tokens=1,956,864,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10193/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=1,957,056,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10194/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=1,957,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10195/500000] + train/ActionNoiseL2Loss=0.0226 + throughput/total_tokens=1,957,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10196/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=1,957,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10197/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=1,957,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10198/500000] + train/ActionNoiseL2Loss=0.0796 + throughput/total_tokens=1,958,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10199/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=1,958,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10200/500000] + optim/total_grad_norm=0.9511 + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,958,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10201/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,958,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10202/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=1,958,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10203/500000] + train/ActionNoiseL2Loss=0.0203 + throughput/total_tokens=1,958,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10204/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=1,959,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10205/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,959,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10206/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=1,959,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10207/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=1,959,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10208/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,959,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10209/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=1,960,128,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10210/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=1,960,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=10211/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=1,960,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10212/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,960,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10213/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=1,960,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10214/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=1,961,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10215/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,961,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10216/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=1,961,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10217/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=1,961,664,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10218/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=1,961,856,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10219/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=1,962,048,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10220/500000] + optim/total_grad_norm=0.7070 + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,962,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10221/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=1,962,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10222/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=1,962,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10223/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=1,962,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10224/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=1,963,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10225/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=1,963,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10226/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=1,963,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10227/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,963,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10228/500000] + train/ActionNoiseL2Loss=0.0780 + throughput/total_tokens=1,963,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10229/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,963,968,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10230/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,964,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10231/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,964,352,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10232/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,964,544,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10233/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=1,964,736,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10234/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,964,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10235/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=1,965,120,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10236/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=1,965,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10237/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=1,965,504,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10238/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=1,965,696,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10239/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,965,888,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10240/500000] + optim/total_grad_norm=0.8315 + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=1,966,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10241/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,966,272,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10242/500000] + train/ActionNoiseL2Loss=0.0818 + throughput/total_tokens=1,966,464,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10243/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=1,966,656,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10244/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=1,966,848,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10245/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=1,967,040,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10246/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=1,967,232,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10247/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=1,967,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10248/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=1,967,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10249/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=1,967,808,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10250/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=1,968,000,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10251/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=1,968,192,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10252/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=1,968,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10253/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=1,968,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10254/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=1,968,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10255/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=1,968,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10256/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=1,969,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10257/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=1,969,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10258/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=1,969,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10259/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=1,969,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10260/500000] + optim/total_grad_norm=0.4807 + train/ActionNoiseL2Loss=0.0246 + throughput/total_tokens=1,969,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10261/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=1,970,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10262/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,970,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10263/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=1,970,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10264/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=1,970,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10265/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=1,970,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10266/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,971,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10267/500000] + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=1,971,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10268/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=1,971,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10269/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=1,971,648,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10270/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=1,971,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10271/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,972,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10272/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=1,972,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10273/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,972,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10274/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,972,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10275/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=1,972,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10276/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=1,972,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10277/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=1,973,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10278/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=1,973,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10279/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,973,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10280/500000] + optim/total_grad_norm=0.6884 + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=1,973,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10281/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=1,973,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10282/500000] + train/ActionNoiseL2Loss=0.0758 + throughput/total_tokens=1,974,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10283/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=1,974,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10284/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=1,974,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10285/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,974,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10286/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=1,974,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10287/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,975,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10288/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=1,975,296,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10289/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=1,975,488,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10290/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=1,975,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10291/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=1,975,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10292/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=1,976,064,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10293/500000] + train/ActionNoiseL2Loss=0.0369 + throughput/total_tokens=1,976,256,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10294/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=1,976,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10295/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=1,976,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10296/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,976,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10297/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,977,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10298/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=1,977,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10299/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=1,977,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10300/500000] + optim/total_grad_norm=0.6584 + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=1,977,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10301/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=1,977,792,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10302/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=1,977,984,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10303/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,978,176,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=10304/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=1,978,368,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=10305/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=1,978,560,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=10306/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=1,978,752,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=10307/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=1,978,944,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10308/500000] + train/ActionNoiseL2Loss=0.0866 + throughput/total_tokens=1,979,136,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10309/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=1,979,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10310/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=1,979,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=10311/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=1,979,712,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10312/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=1,979,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10313/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=1,980,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10314/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=1,980,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10315/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=1,980,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10316/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=1,980,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10317/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=1,980,864,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10318/500000] + train/ActionNoiseL2Loss=0.0712 + throughput/total_tokens=1,981,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10319/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=1,981,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10320/500000] + optim/total_grad_norm=0.9382 + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,981,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10321/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=1,981,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10322/500000] + train/ActionNoiseL2Loss=0.0275 + throughput/total_tokens=1,981,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10323/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=1,982,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10324/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=1,982,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10325/500000] + train/ActionNoiseL2Loss=0.1019 + throughput/total_tokens=1,982,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10326/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=1,982,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10327/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=1,982,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10328/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=1,982,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10329/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=1,983,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10330/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=1,983,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10331/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=1,983,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10332/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=1,983,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10333/500000] + train/ActionNoiseL2Loss=0.0534 + throughput/total_tokens=1,983,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10334/500000] + train/ActionNoiseL2Loss=0.1017 + throughput/total_tokens=1,984,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10335/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=1,984,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10336/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,984,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10337/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=1,984,704,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10338/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=1,984,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10339/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=1,985,088,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10340/500000] + optim/total_grad_norm=0.5676 + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=1,985,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10341/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=1,985,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10342/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=1,985,664,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10343/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=1,985,856,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10344/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=1,986,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10345/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=1,986,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10346/500000] + train/ActionNoiseL2Loss=0.0168 + throughput/total_tokens=1,986,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10347/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=1,986,624,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10348/500000] + train/ActionNoiseL2Loss=0.0956 + throughput/total_tokens=1,986,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10349/500000] + train/ActionNoiseL2Loss=0.0298 + throughput/total_tokens=1,987,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10350/500000] + train/ActionNoiseL2Loss=0.1191 + throughput/total_tokens=1,987,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10351/500000] + train/ActionNoiseL2Loss=0.0744 + throughput/total_tokens=1,987,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10352/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=1,987,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10353/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=1,987,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10354/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=1,987,968,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10355/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=1,988,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10356/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=1,988,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10357/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=1,988,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10358/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=1,988,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10359/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=1,988,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10360/500000] + optim/total_grad_norm=0.6840 + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=1,989,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10361/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=1,989,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10362/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=1,989,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10363/500000] + train/ActionNoiseL2Loss=0.0931 + throughput/total_tokens=1,989,696,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10364/500000] + train/ActionNoiseL2Loss=0.0648 + throughput/total_tokens=1,989,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10365/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=1,990,080,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10366/500000] + train/ActionNoiseL2Loss=0.0821 + throughput/total_tokens=1,990,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10367/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=1,990,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10368/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=1,990,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10369/500000] + train/ActionNoiseL2Loss=0.0229 + throughput/total_tokens=1,990,848,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10370/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,991,040,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10371/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=1,991,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10372/500000] + train/ActionNoiseL2Loss=0.0846 + throughput/total_tokens=1,991,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10373/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=1,991,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10374/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=1,991,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10375/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=1,992,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10376/500000] + train/ActionNoiseL2Loss=0.0299 + throughput/total_tokens=1,992,192,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10377/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=1,992,384,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10378/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=1,992,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10379/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=1,992,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10380/500000] + optim/total_grad_norm=1.068 + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=1,992,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10381/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=1,993,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10382/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=1,993,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10383/500000] + train/ActionNoiseL2Loss=0.0971 + throughput/total_tokens=1,993,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10384/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=1,993,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10385/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=1,993,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10386/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=1,994,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10387/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=1,994,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10388/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=1,994,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10389/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=1,994,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10390/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=1,994,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10391/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=1,995,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10392/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=1,995,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10393/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=1,995,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10394/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=1,995,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10395/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=1,995,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10396/500000] + train/ActionNoiseL2Loss=0.0472 + throughput/total_tokens=1,996,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10397/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=1,996,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10398/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=1,996,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10399/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=1,996,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10400/500000] + optim/total_grad_norm=0.5587 + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=1,996,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10401/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=1,996,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10402/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=1,997,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10403/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=1,997,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10404/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=1,997,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10405/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=1,997,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10406/500000] + train/ActionNoiseL2Loss=0.0295 + throughput/total_tokens=1,997,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10407/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=1,998,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10408/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=1,998,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10409/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=1,998,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10410/500000] + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=1,998,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10411/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=1,998,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10412/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=1,999,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10413/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=1,999,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10414/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=1,999,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10415/500000] + train/ActionNoiseL2Loss=0.0926 + throughput/total_tokens=1,999,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10416/500000] + train/ActionNoiseL2Loss=0.0703 + throughput/total_tokens=1,999,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10417/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=2,000,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10418/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,000,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10419/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=2,000,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10420/500000] + optim/total_grad_norm=0.4272 + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=2,000,640,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10421/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=2,000,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10422/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=2,001,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10423/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,001,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10424/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=2,001,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10425/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,001,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10426/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=2,001,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10427/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=2,001,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10428/500000] + train/ActionNoiseL2Loss=0.0727 + throughput/total_tokens=2,002,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10429/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=2,002,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10430/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=2,002,560,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10431/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=2,002,752,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10432/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=2,002,944,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10433/500000] + train/ActionNoiseL2Loss=0.1006 + throughput/total_tokens=2,003,136,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10434/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=2,003,328,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10435/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=2,003,520,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10436/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,003,712,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10437/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=2,003,904,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10438/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=2,004,096,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10439/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=2,004,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10440/500000] + optim/total_grad_norm=1.003 + train/ActionNoiseL2Loss=0.0694 + throughput/total_tokens=2,004,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10441/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=2,004,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10442/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=2,004,864,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10443/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=2,005,056,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10444/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=2,005,248,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10445/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=2,005,440,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10446/500000] + train/ActionNoiseL2Loss=0.0802 + throughput/total_tokens=2,005,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10447/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=2,005,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10448/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=2,006,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10449/500000] + train/ActionNoiseL2Loss=0.0248 + throughput/total_tokens=2,006,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10450/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=2,006,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10451/500000] + train/ActionNoiseL2Loss=0.1205 + throughput/total_tokens=2,006,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10452/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=2,006,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10453/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=2,006,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10454/500000] + train/ActionNoiseL2Loss=0.0710 + throughput/total_tokens=2,007,168,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10455/500000] + train/ActionNoiseL2Loss=0.0834 + throughput/total_tokens=2,007,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10456/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=2,007,552,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10457/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=2,007,744,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10458/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=2,007,936,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10459/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=2,008,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10460/500000] + optim/total_grad_norm=1.900 + train/ActionNoiseL2Loss=0.1048 + throughput/total_tokens=2,008,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=10461/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=2,008,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10462/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=2,008,704,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10463/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=2,008,896,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10464/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,009,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10465/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=2,009,280,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10466/500000] + train/ActionNoiseL2Loss=0.0733 + throughput/total_tokens=2,009,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10467/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=2,009,664,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10468/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=2,009,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10469/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=2,010,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10470/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=2,010,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10471/500000] + train/ActionNoiseL2Loss=0.0411 + throughput/total_tokens=2,010,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10472/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=2,010,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10473/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=2,010,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10474/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=2,011,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10475/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=2,011,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10476/500000] + train/ActionNoiseL2Loss=0.1157 + throughput/total_tokens=2,011,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10477/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=2,011,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10478/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=2,011,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10479/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=2,011,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10480/500000] + optim/total_grad_norm=0.7242 + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,012,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10481/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=2,012,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10482/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=2,012,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10483/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=2,012,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10484/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,012,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10485/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=2,013,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10486/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=2,013,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10487/500000] + train/ActionNoiseL2Loss=0.0773 + throughput/total_tokens=2,013,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10488/500000] + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=2,013,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10489/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=2,013,888,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10490/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,014,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10491/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,014,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10492/500000] + train/ActionNoiseL2Loss=0.0980 + throughput/total_tokens=2,014,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10493/500000] + train/ActionNoiseL2Loss=0.1062 + throughput/total_tokens=2,014,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10494/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=2,014,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10495/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=2,015,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10496/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=2,015,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10497/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=2,015,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10498/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=2,015,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10499/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=2,015,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10500/500000] + optim/total_grad_norm=1.034 + train/ActionNoiseL2Loss=0.0981 + throughput/total_tokens=2,016,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +10/14 [07:18:01] INFO | >> Saving config... checkpoint.py:608 +10/14 [07:18:34] INFO | >> Saving model state... checkpoint.py:796 +10/14 [07:19:47] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [07:21:12] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=10501/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=2,016,192,000 + throughput/device/tokens_per_second=1,127 + throughput/device/batches_per_second=0.0470 +[step=10502/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,016,384,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0475 +[step=10503/500000] + train/ActionNoiseL2Loss=0.0761 + throughput/total_tokens=2,016,576,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10504/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=2,016,768,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10505/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=2,016,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10506/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=2,017,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10507/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,017,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10508/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=2,017,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10509/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=2,017,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10510/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=2,017,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10511/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=2,018,112,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10512/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=2,018,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10513/500000] + train/ActionNoiseL2Loss=0.0221 + throughput/total_tokens=2,018,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10514/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,018,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10515/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=2,018,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10516/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=2,019,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10517/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=2,019,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10518/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=2,019,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10519/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=2,019,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10520/500000] + optim/total_grad_norm=0.4486 + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=2,019,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10521/500000] + train/ActionNoiseL2Loss=0.0731 + throughput/total_tokens=2,020,032,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10522/500000] + train/ActionNoiseL2Loss=0.1291 + throughput/total_tokens=2,020,224,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10523/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=2,020,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10524/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=2,020,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10525/500000] + train/ActionNoiseL2Loss=0.0979 + throughput/total_tokens=2,020,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10526/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=2,020,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10527/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=2,021,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10528/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,021,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10529/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,021,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10530/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=2,021,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10531/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=2,021,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10532/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=2,022,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10533/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,022,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10534/500000] + train/ActionNoiseL2Loss=0.1029 + throughput/total_tokens=2,022,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10535/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=2,022,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10536/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,022,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10537/500000] + train/ActionNoiseL2Loss=0.0808 + throughput/total_tokens=2,023,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10538/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=2,023,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10539/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=2,023,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10540/500000] + optim/total_grad_norm=0.8212 + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=2,023,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10541/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,023,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10542/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=2,024,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10543/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=2,024,256,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10544/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=2,024,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10545/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=2,024,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10546/500000] + train/ActionNoiseL2Loss=0.0338 + throughput/total_tokens=2,024,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10547/500000] + train/ActionNoiseL2Loss=0.0224 + throughput/total_tokens=2,025,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10548/500000] + train/ActionNoiseL2Loss=0.0214 + throughput/total_tokens=2,025,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10549/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=2,025,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10550/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,025,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10551/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=2,025,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10552/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=2,025,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10553/500000] + train/ActionNoiseL2Loss=0.0230 + throughput/total_tokens=2,026,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10554/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=2,026,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10555/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=2,026,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10556/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=2,026,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10557/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=2,026,944,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10558/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=2,027,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10559/500000] + train/ActionNoiseL2Loss=0.0476 + throughput/total_tokens=2,027,328,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10560/500000] + optim/total_grad_norm=0.9155 + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=2,027,520,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10561/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,027,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10562/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=2,027,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10563/500000] + train/ActionNoiseL2Loss=0.0301 + throughput/total_tokens=2,028,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10564/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=2,028,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10565/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=2,028,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10566/500000] + train/ActionNoiseL2Loss=0.0738 + throughput/total_tokens=2,028,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10567/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=2,028,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10568/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,029,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10569/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=2,029,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10570/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,029,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10571/500000] + train/ActionNoiseL2Loss=0.1064 + throughput/total_tokens=2,029,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10572/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=2,029,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10573/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=2,030,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10574/500000] + train/ActionNoiseL2Loss=0.0759 + throughput/total_tokens=2,030,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10575/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=2,030,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10576/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=2,030,592,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10577/500000] + train/ActionNoiseL2Loss=0.1359 + throughput/total_tokens=2,030,784,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10578/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=2,030,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10579/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,031,168,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10580/500000] + optim/total_grad_norm=0.8212 + train/ActionNoiseL2Loss=0.0295 + throughput/total_tokens=2,031,360,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10581/500000] + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=2,031,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10582/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=2,031,744,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10583/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=2,031,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10584/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=2,032,128,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10585/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=2,032,320,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10586/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=2,032,512,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10587/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=2,032,704,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10588/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,032,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10589/500000] + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=2,033,088,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10590/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,033,280,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10591/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,033,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10592/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=2,033,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10593/500000] + train/ActionNoiseL2Loss=0.1634 + throughput/total_tokens=2,033,856,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10594/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=2,034,048,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10595/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=2,034,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10596/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=2,034,432,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10597/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=2,034,624,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10598/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=2,034,816,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10599/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,035,008,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10600/500000] + optim/total_grad_norm=0.5134 + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=2,035,200,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10601/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=2,035,392,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10602/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=2,035,584,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10603/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,035,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10604/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=2,035,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10605/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=2,036,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10606/500000] + train/ActionNoiseL2Loss=0.0740 + throughput/total_tokens=2,036,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10607/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,036,544,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10608/500000] + train/ActionNoiseL2Loss=0.0277 + throughput/total_tokens=2,036,736,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10609/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,036,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10610/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=2,037,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=10611/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,037,312,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10612/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=2,037,504,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10613/500000] + train/ActionNoiseL2Loss=0.0845 + throughput/total_tokens=2,037,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10614/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=2,037,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10615/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=2,038,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10616/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=2,038,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10617/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=2,038,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10618/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=2,038,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10619/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,038,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10620/500000] + optim/total_grad_norm=0.5240 + train/ActionNoiseL2Loss=0.0337 + throughput/total_tokens=2,039,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10621/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,039,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10622/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=2,039,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10623/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=2,039,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10624/500000] + train/ActionNoiseL2Loss=0.0833 + throughput/total_tokens=2,039,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10625/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=2,040,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10626/500000] + train/ActionNoiseL2Loss=0.0269 + throughput/total_tokens=2,040,192,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10627/500000] + train/ActionNoiseL2Loss=0.0978 + throughput/total_tokens=2,040,384,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10628/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=2,040,576,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10629/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,040,768,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10630/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=2,040,960,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10631/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=2,041,152,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=10632/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=2,041,344,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10633/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=2,041,536,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10634/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,041,728,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10635/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=2,041,920,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10636/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=2,042,112,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10637/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=2,042,304,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10638/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,042,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10639/500000] + train/ActionNoiseL2Loss=0.0185 + throughput/total_tokens=2,042,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10640/500000] + optim/total_grad_norm=0.4841 + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=2,042,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10641/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=2,043,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10642/500000] + train/ActionNoiseL2Loss=0.0270 + throughput/total_tokens=2,043,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10643/500000] + train/ActionNoiseL2Loss=0.0569 + throughput/total_tokens=2,043,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10644/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=2,043,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10645/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=2,043,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10646/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=2,044,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10647/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=2,044,224,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10648/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,044,416,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10649/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=2,044,608,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10650/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=2,044,800,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10651/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,044,992,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10652/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=2,045,184,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10653/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=2,045,376,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10654/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=2,045,568,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10655/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=2,045,760,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10656/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=2,045,952,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=10657/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=2,046,144,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=10658/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=2,046,336,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10659/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=2,046,528,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10660/500000] + optim/total_grad_norm=0.5473 + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=2,046,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=10661/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=2,046,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10662/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=2,047,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10663/500000] + train/ActionNoiseL2Loss=0.0724 + throughput/total_tokens=2,047,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10664/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=2,047,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10665/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,047,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10666/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=2,047,872,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10667/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=2,048,064,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10668/500000] + train/ActionNoiseL2Loss=0.0312 + throughput/total_tokens=2,048,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10669/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=2,048,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10670/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=2,048,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10671/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,048,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10672/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=2,049,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10673/500000] + train/ActionNoiseL2Loss=0.0326 + throughput/total_tokens=2,049,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10674/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=2,049,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10675/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=2,049,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10676/500000] + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=2,049,792,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10677/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=2,049,984,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10678/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,050,176,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10679/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=2,050,368,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10680/500000] + optim/total_grad_norm=0.9289 + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=2,050,560,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10681/500000] + train/ActionNoiseL2Loss=0.1050 + throughput/total_tokens=2,050,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10682/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=2,050,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10683/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,051,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10684/500000] + train/ActionNoiseL2Loss=0.0883 + throughput/total_tokens=2,051,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10685/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,051,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10686/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=2,051,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10687/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=2,051,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10688/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=2,052,096,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10689/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=2,052,288,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10690/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=2,052,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10691/500000] + train/ActionNoiseL2Loss=0.0312 + throughput/total_tokens=2,052,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10692/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=2,052,864,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10693/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,053,056,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10694/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,053,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10695/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=2,053,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10696/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=2,053,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10697/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=2,053,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10698/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,054,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10699/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=2,054,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10700/500000] + optim/total_grad_norm=0.7160 + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=2,054,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10701/500000] + train/ActionNoiseL2Loss=0.0446 + throughput/total_tokens=2,054,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10702/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=2,054,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10703/500000] + train/ActionNoiseL2Loss=0.0765 + throughput/total_tokens=2,054,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10704/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=2,055,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10705/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=2,055,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10706/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,055,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10707/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=2,055,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10708/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=2,055,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10709/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,056,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10710/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=2,056,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10711/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=2,056,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10712/500000] + train/ActionNoiseL2Loss=0.1025 + throughput/total_tokens=2,056,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10713/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=2,056,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10714/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=2,057,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10715/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,057,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10716/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=2,057,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10717/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=2,057,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10718/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,057,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10719/500000] + train/ActionNoiseL2Loss=0.0850 + throughput/total_tokens=2,058,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10720/500000] + optim/total_grad_norm=0.6883 + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=2,058,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10721/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=2,058,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10722/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=2,058,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10723/500000] + train/ActionNoiseL2Loss=0.1254 + throughput/total_tokens=2,058,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10724/500000] + train/ActionNoiseL2Loss=0.0827 + throughput/total_tokens=2,059,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10725/500000] + train/ActionNoiseL2Loss=0.0806 + throughput/total_tokens=2,059,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10726/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,059,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10727/500000] + train/ActionNoiseL2Loss=0.0298 + throughput/total_tokens=2,059,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10728/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=2,059,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10729/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=2,059,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10730/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=2,060,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10731/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=2,060,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10732/500000] + train/ActionNoiseL2Loss=0.0607 + throughput/total_tokens=2,060,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10733/500000] + train/ActionNoiseL2Loss=0.0327 + throughput/total_tokens=2,060,736,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10734/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,060,928,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10735/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=2,061,120,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10736/500000] + train/ActionNoiseL2Loss=0.0766 + throughput/total_tokens=2,061,312,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10737/500000] + train/ActionNoiseL2Loss=0.0497 + throughput/total_tokens=2,061,504,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10738/500000] + train/ActionNoiseL2Loss=0.0862 + throughput/total_tokens=2,061,696,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10739/500000] + train/ActionNoiseL2Loss=0.0923 + throughput/total_tokens=2,061,888,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10740/500000] + optim/total_grad_norm=0.9992 + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=2,062,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10741/500000] + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=2,062,272,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10742/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=2,062,464,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10743/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=2,062,656,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10744/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=2,062,848,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10745/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=2,063,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10746/500000] + train/ActionNoiseL2Loss=0.0341 + throughput/total_tokens=2,063,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10747/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=2,063,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10748/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=2,063,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10749/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,063,808,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10750/500000] + train/ActionNoiseL2Loss=0.0768 + throughput/total_tokens=2,064,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10751/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=2,064,192,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10752/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=2,064,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10753/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=2,064,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10754/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=2,064,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10755/500000] + train/ActionNoiseL2Loss=0.0872 + throughput/total_tokens=2,064,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10756/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,065,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10757/500000] + train/ActionNoiseL2Loss=0.0952 + throughput/total_tokens=2,065,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10758/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=2,065,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10759/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=2,065,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10760/500000] + optim/total_grad_norm=1.894 + train/ActionNoiseL2Loss=0.0928 + throughput/total_tokens=2,065,920,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10761/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=2,066,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10762/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=2,066,304,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10763/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=2,066,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10764/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,066,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10765/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=2,066,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10766/500000] + train/ActionNoiseL2Loss=0.0767 + throughput/total_tokens=2,067,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10767/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=2,067,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10768/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=2,067,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10769/500000] + train/ActionNoiseL2Loss=0.0354 + throughput/total_tokens=2,067,648,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10770/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=2,067,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10771/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=2,068,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10772/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=2,068,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10773/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,068,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10774/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,068,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10775/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=2,068,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10776/500000] + train/ActionNoiseL2Loss=0.0717 + throughput/total_tokens=2,068,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10777/500000] + train/ActionNoiseL2Loss=0.0252 + throughput/total_tokens=2,069,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10778/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=2,069,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10779/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,069,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10780/500000] + optim/total_grad_norm=0.4728 + train/ActionNoiseL2Loss=0.0253 + throughput/total_tokens=2,069,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10781/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,069,952,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10782/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=2,070,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10783/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=2,070,336,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10784/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=2,070,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10785/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,070,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10786/500000] + train/ActionNoiseL2Loss=0.0494 + throughput/total_tokens=2,070,912,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10787/500000] + train/ActionNoiseL2Loss=0.0218 + throughput/total_tokens=2,071,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10788/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=2,071,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10789/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=2,071,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10790/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=2,071,680,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10791/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,071,872,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10792/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,072,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10793/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=2,072,256,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10794/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,072,448,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10795/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=2,072,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10796/500000] + train/ActionNoiseL2Loss=0.0929 + throughput/total_tokens=2,072,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10797/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,073,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10798/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=2,073,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10799/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=2,073,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10800/500000] + optim/total_grad_norm=0.7029 + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=2,073,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10801/500000] + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=2,073,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10802/500000] + train/ActionNoiseL2Loss=0.0270 + throughput/total_tokens=2,073,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10803/500000] + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,074,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10804/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,074,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10805/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=2,074,560,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10806/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=2,074,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10807/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,074,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10808/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=2,075,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10809/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,075,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10810/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,075,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10811/500000] + train/ActionNoiseL2Loss=0.0539 + throughput/total_tokens=2,075,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10812/500000] + train/ActionNoiseL2Loss=0.0217 + throughput/total_tokens=2,075,904,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10813/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=2,076,096,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10814/500000] + train/ActionNoiseL2Loss=0.0815 + throughput/total_tokens=2,076,288,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10815/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,076,480,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10816/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=2,076,672,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10817/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,076,864,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10818/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=2,077,056,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10819/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=2,077,248,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10820/500000] + optim/total_grad_norm=0.7852 + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,077,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10821/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,077,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10822/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=2,077,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10823/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=2,078,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10824/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=2,078,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10825/500000] + train/ActionNoiseL2Loss=0.0891 + throughput/total_tokens=2,078,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10826/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=2,078,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10827/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=2,078,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10828/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=2,078,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10829/500000] + train/ActionNoiseL2Loss=0.0284 + throughput/total_tokens=2,079,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10830/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,079,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10831/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=2,079,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10832/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=2,079,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10833/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=2,079,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10834/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,080,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10835/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=2,080,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10836/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=2,080,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10837/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=2,080,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10838/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=2,080,896,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10839/500000] + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=2,081,088,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10840/500000] + optim/total_grad_norm=0.8971 + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=2,081,280,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10841/500000] + train/ActionNoiseL2Loss=0.0664 + throughput/total_tokens=2,081,472,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10842/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=2,081,664,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10843/500000] + train/ActionNoiseL2Loss=0.0555 + throughput/total_tokens=2,081,856,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10844/500000] + train/ActionNoiseL2Loss=0.0904 + throughput/total_tokens=2,082,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10845/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=2,082,240,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10846/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=2,082,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10847/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=2,082,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10848/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=2,082,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10849/500000] + train/ActionNoiseL2Loss=0.0366 + throughput/total_tokens=2,083,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10850/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,083,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10851/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=2,083,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10852/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=2,083,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10853/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=2,083,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10854/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,083,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10855/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,084,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10856/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,084,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10857/500000] + train/ActionNoiseL2Loss=0.0745 + throughput/total_tokens=2,084,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10858/500000] + train/ActionNoiseL2Loss=0.0656 + throughput/total_tokens=2,084,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10859/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=2,084,928,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10860/500000] + optim/total_grad_norm=0.8742 + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=2,085,120,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10861/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=2,085,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10862/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=2,085,504,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10863/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=2,085,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10864/500000] + train/ActionNoiseL2Loss=0.0631 + throughput/total_tokens=2,085,888,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10865/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=2,086,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10866/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=2,086,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10867/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=2,086,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10868/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,086,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10869/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=2,086,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10870/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=2,087,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10871/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=2,087,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10872/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=2,087,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10873/500000] + train/ActionNoiseL2Loss=0.1089 + throughput/total_tokens=2,087,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10874/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=2,087,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10875/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=2,088,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10876/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=2,088,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10877/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=2,088,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10878/500000] + train/ActionNoiseL2Loss=0.0278 + throughput/total_tokens=2,088,576,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10879/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=2,088,768,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10880/500000] + optim/total_grad_norm=0.9605 + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=2,088,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10881/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=2,089,152,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10882/500000] + train/ActionNoiseL2Loss=0.1030 + throughput/total_tokens=2,089,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10883/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,089,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10884/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=2,089,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10885/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,089,920,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10886/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=2,090,112,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10887/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=2,090,304,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10888/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=2,090,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10889/500000] + train/ActionNoiseL2Loss=0.0925 + throughput/total_tokens=2,090,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10890/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=2,090,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10891/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=2,091,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10892/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=2,091,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10893/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=2,091,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10894/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=2,091,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10895/500000] + train/ActionNoiseL2Loss=0.0739 + throughput/total_tokens=2,091,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10896/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=2,092,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10897/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=2,092,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10898/500000] + train/ActionNoiseL2Loss=0.0437 + throughput/total_tokens=2,092,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10899/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=2,092,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10900/500000] + optim/total_grad_norm=0.8769 + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=2,092,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10901/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=2,092,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10902/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=2,093,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10903/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,093,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10904/500000] + train/ActionNoiseL2Loss=0.0823 + throughput/total_tokens=2,093,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10905/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,093,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10906/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,093,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10907/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=2,094,144,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10908/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=2,094,336,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10909/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=2,094,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10910/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=2,094,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=10911/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,094,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10912/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=2,095,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10913/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=2,095,296,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10914/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=2,095,488,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10915/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=2,095,680,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10916/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=2,095,872,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=10917/500000] + train/ActionNoiseL2Loss=0.0811 + throughput/total_tokens=2,096,064,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10918/500000] + train/ActionNoiseL2Loss=0.0677 + throughput/total_tokens=2,096,256,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10919/500000] + train/ActionNoiseL2Loss=0.0243 + throughput/total_tokens=2,096,448,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=10920/500000] + optim/total_grad_norm=0.9304 + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,096,640,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10921/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=2,096,832,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10922/500000] + train/ActionNoiseL2Loss=0.0226 + throughput/total_tokens=2,097,024,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10923/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=2,097,216,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10924/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=2,097,408,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10925/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=2,097,600,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10926/500000] + train/ActionNoiseL2Loss=0.0693 + throughput/total_tokens=2,097,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10927/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=2,097,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10928/500000] + train/ActionNoiseL2Loss=0.0474 + throughput/total_tokens=2,098,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10929/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=2,098,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10930/500000] + train/ActionNoiseL2Loss=0.0620 + throughput/total_tokens=2,098,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10931/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=2,098,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10932/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=2,098,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10933/500000] + train/ActionNoiseL2Loss=0.0203 + throughput/total_tokens=2,099,136,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10934/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=2,099,328,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10935/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=2,099,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10936/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,099,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10937/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=2,099,904,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10938/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=2,100,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10939/500000] + train/ActionNoiseL2Loss=0.0748 + throughput/total_tokens=2,100,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10940/500000] + optim/total_grad_norm=0.7417 + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=2,100,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10941/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,100,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10942/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,100,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10943/500000] + train/ActionNoiseL2Loss=0.0965 + throughput/total_tokens=2,101,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10944/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=2,101,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10945/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,101,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=10946/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=2,101,632,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10947/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=2,101,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10948/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=2,102,016,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10949/500000] + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=2,102,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=10950/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,102,400,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=10951/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=2,102,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10952/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=2,102,784,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10953/500000] + train/ActionNoiseL2Loss=0.0394 + throughput/total_tokens=2,102,976,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10954/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=2,103,168,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=10955/500000] + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=2,103,360,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10956/500000] + train/ActionNoiseL2Loss=0.0421 + throughput/total_tokens=2,103,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10957/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=2,103,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10958/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,103,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10959/500000] + train/ActionNoiseL2Loss=0.0506 + throughput/total_tokens=2,104,128,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10960/500000] + optim/total_grad_norm=1.126 + train/ActionNoiseL2Loss=0.0900 + throughput/total_tokens=2,104,320,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=10961/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=2,104,512,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10962/500000] + train/ActionNoiseL2Loss=0.0843 + throughput/total_tokens=2,104,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10963/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=2,104,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10964/500000] + train/ActionNoiseL2Loss=0.0551 + throughput/total_tokens=2,105,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=10965/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=2,105,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10966/500000] + train/ActionNoiseL2Loss=0.0358 + throughput/total_tokens=2,105,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10967/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=2,105,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=10968/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=2,105,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10969/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,106,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=10970/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=2,106,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10971/500000] + train/ActionNoiseL2Loss=0.0319 + throughput/total_tokens=2,106,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10972/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=2,106,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10973/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=2,106,816,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=10974/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=2,107,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10975/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=2,107,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10976/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,107,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10977/500000] + train/ActionNoiseL2Loss=0.0732 + throughput/total_tokens=2,107,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10978/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=2,107,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10979/500000] + train/ActionNoiseL2Loss=0.0618 + throughput/total_tokens=2,107,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10980/500000] + optim/total_grad_norm=1.202 + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=2,108,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10981/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=2,108,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10982/500000] + train/ActionNoiseL2Loss=0.0756 + throughput/total_tokens=2,108,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10983/500000] + train/ActionNoiseL2Loss=0.1137 + throughput/total_tokens=2,108,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10984/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,108,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10985/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=2,109,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10986/500000] + train/ActionNoiseL2Loss=0.0386 + throughput/total_tokens=2,109,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10987/500000] + train/ActionNoiseL2Loss=0.0190 + throughput/total_tokens=2,109,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10988/500000] + train/ActionNoiseL2Loss=0.1068 + throughput/total_tokens=2,109,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10989/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=2,109,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10990/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=2,110,080,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=10991/500000] + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=2,110,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10992/500000] + train/ActionNoiseL2Loss=0.0357 + throughput/total_tokens=2,110,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10993/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=2,110,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10994/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=2,110,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=10995/500000] + train/ActionNoiseL2Loss=0.0726 + throughput/total_tokens=2,111,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10996/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=2,111,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10997/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=2,111,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10998/500000] + train/ActionNoiseL2Loss=0.1147 + throughput/total_tokens=2,111,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=10999/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,111,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11000/500000] + optim/total_grad_norm=0.6865 + train/ActionNoiseL2Loss=0.0584 + throughput/total_tokens=2,112,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/14 [10:16:56] INFO | >> Saving config... checkpoint.py:608 +10/14 [10:17:29] INFO | >> Saving model state... checkpoint.py:796 +10/14 [10:18:43] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [10:20:16] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=11001/500000] + train/ActionNoiseL2Loss=0.1310 + throughput/total_tokens=2,112,192,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11002/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=2,112,384,000 + throughput/device/tokens_per_second=1,135 + throughput/device/batches_per_second=0.0473 +[step=11003/500000] + train/ActionNoiseL2Loss=0.0985 + throughput/total_tokens=2,112,576,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=11004/500000] + train/ActionNoiseL2Loss=0.0962 + throughput/total_tokens=2,112,768,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0475 +[step=11005/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=2,112,960,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11006/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=2,113,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11007/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=2,113,344,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11008/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,113,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11009/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=2,113,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11010/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=2,113,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11011/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=2,114,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11012/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=2,114,304,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11013/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=2,114,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11014/500000] + train/ActionNoiseL2Loss=0.0611 + throughput/total_tokens=2,114,688,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11015/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=2,114,880,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11016/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=2,115,072,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11017/500000] + train/ActionNoiseL2Loss=0.0790 + throughput/total_tokens=2,115,264,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11018/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=2,115,456,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11019/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,115,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11020/500000] + optim/total_grad_norm=0.6903 + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=2,115,840,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11021/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=2,116,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11022/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=2,116,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11023/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=2,116,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11024/500000] + train/ActionNoiseL2Loss=0.0209 + throughput/total_tokens=2,116,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11025/500000] + train/ActionNoiseL2Loss=0.0458 + throughput/total_tokens=2,116,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11026/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,116,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11027/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=2,117,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11028/500000] + train/ActionNoiseL2Loss=0.0483 + throughput/total_tokens=2,117,376,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11029/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,117,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11030/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,117,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11031/500000] + train/ActionNoiseL2Loss=0.0230 + throughput/total_tokens=2,117,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11032/500000] + train/ActionNoiseL2Loss=0.0736 + throughput/total_tokens=2,118,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11033/500000] + train/ActionNoiseL2Loss=0.0467 + throughput/total_tokens=2,118,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11034/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=2,118,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11035/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=2,118,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11036/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=2,118,912,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11037/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=2,119,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11038/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,119,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11039/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=2,119,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11040/500000] + optim/total_grad_norm=0.6423 + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=2,119,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11041/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,119,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11042/500000] + train/ActionNoiseL2Loss=0.0570 + throughput/total_tokens=2,120,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11043/500000] + train/ActionNoiseL2Loss=0.0324 + throughput/total_tokens=2,120,256,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11044/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=2,120,448,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11045/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=2,120,640,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11046/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=2,120,832,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11047/500000] + train/ActionNoiseL2Loss=0.1028 + throughput/total_tokens=2,121,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11048/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,121,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11049/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=2,121,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11050/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=2,121,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11051/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=2,121,792,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11052/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=2,121,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11053/500000] + train/ActionNoiseL2Loss=0.0248 + throughput/total_tokens=2,122,176,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11054/500000] + train/ActionNoiseL2Loss=0.0792 + throughput/total_tokens=2,122,368,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11055/500000] + train/ActionNoiseL2Loss=0.0788 + throughput/total_tokens=2,122,560,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11056/500000] + train/ActionNoiseL2Loss=0.0722 + throughput/total_tokens=2,122,752,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11057/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=2,122,944,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11058/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=2,123,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11059/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=2,123,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11060/500000] + optim/total_grad_norm=0.8191 + train/ActionNoiseL2Loss=0.0220 + throughput/total_tokens=2,123,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11061/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,123,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11062/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=2,123,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11063/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=2,124,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11064/500000] + train/ActionNoiseL2Loss=0.1021 + throughput/total_tokens=2,124,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11065/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=2,124,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11066/500000] + train/ActionNoiseL2Loss=0.0913 + throughput/total_tokens=2,124,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11067/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,124,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11068/500000] + train/ActionNoiseL2Loss=0.0702 + throughput/total_tokens=2,125,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11069/500000] + train/ActionNoiseL2Loss=0.1178 + throughput/total_tokens=2,125,248,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11070/500000] + train/ActionNoiseL2Loss=0.1119 + throughput/total_tokens=2,125,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11071/500000] + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=2,125,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11072/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=2,125,824,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11073/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=2,126,016,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=11074/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=2,126,208,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=11075/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=2,126,400,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=11076/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=2,126,592,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=11077/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=2,126,784,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=11078/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=2,126,976,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11079/500000] + train/ActionNoiseL2Loss=0.0296 + throughput/total_tokens=2,127,168,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11080/500000] + optim/total_grad_norm=1.151 + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=2,127,360,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11081/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,127,552,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11082/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=2,127,744,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11083/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=2,127,936,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11084/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=2,128,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11085/500000] + train/ActionNoiseL2Loss=0.0294 + throughput/total_tokens=2,128,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11086/500000] + train/ActionNoiseL2Loss=0.0828 + throughput/total_tokens=2,128,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11087/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=2,128,704,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11088/500000] + train/ActionNoiseL2Loss=0.0334 + throughput/total_tokens=2,128,896,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11089/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,129,088,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11090/500000] + train/ActionNoiseL2Loss=0.0721 + throughput/total_tokens=2,129,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11091/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,129,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11092/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=2,129,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11093/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=2,129,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11094/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=2,130,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11095/500000] + train/ActionNoiseL2Loss=0.0246 + throughput/total_tokens=2,130,240,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11096/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=2,130,432,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11097/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=2,130,624,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11098/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=2,130,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11099/500000] + train/ActionNoiseL2Loss=0.0488 + throughput/total_tokens=2,131,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11100/500000] + optim/total_grad_norm=0.8895 + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=2,131,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11101/500000] + train/ActionNoiseL2Loss=0.1176 + throughput/total_tokens=2,131,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11102/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,131,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11103/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=2,131,776,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11104/500000] + train/ActionNoiseL2Loss=0.0858 + throughput/total_tokens=2,131,968,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11105/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=2,132,160,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11106/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=2,132,352,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11107/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=2,132,544,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11108/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=2,132,736,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11109/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,132,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11110/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=2,133,120,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11111/500000] + train/ActionNoiseL2Loss=0.0781 + throughput/total_tokens=2,133,312,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11112/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=2,133,504,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11113/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,133,696,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11114/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=2,133,888,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11115/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,134,080,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11116/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=2,134,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11117/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=2,134,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11118/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=2,134,656,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11119/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,134,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11120/500000] + optim/total_grad_norm=0.6427 + train/ActionNoiseL2Loss=0.0610 + throughput/total_tokens=2,135,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11121/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=2,135,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11122/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,135,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11123/500000] + train/ActionNoiseL2Loss=0.0509 + throughput/total_tokens=2,135,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11124/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,135,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11125/500000] + train/ActionNoiseL2Loss=0.0140 + throughput/total_tokens=2,136,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11126/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,136,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11127/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=2,136,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11128/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=2,136,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11129/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=2,136,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11130/500000] + train/ActionNoiseL2Loss=0.0291 + throughput/total_tokens=2,136,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11131/500000] + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=2,137,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11132/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=2,137,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11133/500000] + train/ActionNoiseL2Loss=0.0393 + throughput/total_tokens=2,137,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11134/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,137,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11135/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=2,137,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11136/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=2,138,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11137/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,138,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11138/500000] + train/ActionNoiseL2Loss=0.0377 + throughput/total_tokens=2,138,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11139/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=2,138,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11140/500000] + optim/total_grad_norm=0.9201 + train/ActionNoiseL2Loss=0.1063 + throughput/total_tokens=2,138,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11141/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=2,139,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11142/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=2,139,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11143/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=2,139,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11144/500000] + train/ActionNoiseL2Loss=0.0268 + throughput/total_tokens=2,139,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11145/500000] + train/ActionNoiseL2Loss=0.0387 + throughput/total_tokens=2,139,840,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11146/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,140,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11147/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,140,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11148/500000] + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=2,140,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11149/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,140,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11150/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=2,140,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11151/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=2,140,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11152/500000] + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=2,141,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11153/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,141,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11154/500000] + train/ActionNoiseL2Loss=0.0346 + throughput/total_tokens=2,141,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11155/500000] + train/ActionNoiseL2Loss=0.0183 + throughput/total_tokens=2,141,760,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11156/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,141,952,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11157/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=2,142,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11158/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,142,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11159/500000] + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=2,142,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11160/500000] + optim/total_grad_norm=0.6352 + train/ActionNoiseL2Loss=0.0248 + throughput/total_tokens=2,142,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11161/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=2,142,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11162/500000] + train/ActionNoiseL2Loss=0.0463 + throughput/total_tokens=2,143,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11163/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=2,143,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11164/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=2,143,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11165/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=2,143,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11166/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,143,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11167/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=2,144,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11168/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=2,144,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11169/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,144,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11170/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=2,144,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11171/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,144,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11172/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=2,145,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11173/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=2,145,216,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11174/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=2,145,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11175/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=2,145,600,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11176/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,145,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11177/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=2,145,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11178/500000] + train/ActionNoiseL2Loss=0.0541 + throughput/total_tokens=2,146,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11179/500000] + train/ActionNoiseL2Loss=0.0275 + throughput/total_tokens=2,146,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11180/500000] + optim/total_grad_norm=0.5327 + train/ActionNoiseL2Loss=0.0417 + throughput/total_tokens=2,146,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11181/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=2,146,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11182/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,146,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11183/500000] + train/ActionNoiseL2Loss=0.0892 + throughput/total_tokens=2,147,136,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11184/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,147,328,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11185/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,147,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11186/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=2,147,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11187/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=2,147,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11188/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=2,148,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11189/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=2,148,288,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11190/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=2,148,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11191/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=2,148,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11192/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=2,148,864,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11193/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,149,056,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11194/500000] + train/ActionNoiseL2Loss=0.0932 + throughput/total_tokens=2,149,248,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11195/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=2,149,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11196/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=2,149,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11197/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=2,149,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11198/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=2,150,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11199/500000] + train/ActionNoiseL2Loss=0.0583 + throughput/total_tokens=2,150,208,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11200/500000] + optim/total_grad_norm=0.3373 + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=2,150,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11201/500000] + train/ActionNoiseL2Loss=0.0190 + throughput/total_tokens=2,150,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11202/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=2,150,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11203/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=2,150,976,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11204/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=2,151,168,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11205/500000] + train/ActionNoiseL2Loss=0.0647 + throughput/total_tokens=2,151,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11206/500000] + train/ActionNoiseL2Loss=0.1402 + throughput/total_tokens=2,151,552,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11207/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=2,151,744,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11208/500000] + train/ActionNoiseL2Loss=0.0259 + throughput/total_tokens=2,151,936,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11209/500000] + train/ActionNoiseL2Loss=0.0427 + throughput/total_tokens=2,152,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11210/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,152,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11211/500000] + train/ActionNoiseL2Loss=0.0705 + throughput/total_tokens=2,152,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11212/500000] + train/ActionNoiseL2Loss=0.0198 + throughput/total_tokens=2,152,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11213/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=2,152,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11214/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=2,153,088,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11215/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=2,153,280,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11216/500000] + train/ActionNoiseL2Loss=0.0627 + throughput/total_tokens=2,153,472,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11217/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=2,153,664,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11218/500000] + train/ActionNoiseL2Loss=0.0801 + throughput/total_tokens=2,153,856,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11219/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=2,154,048,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11220/500000] + optim/total_grad_norm=0.9183 + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=2,154,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11221/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,154,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11222/500000] + train/ActionNoiseL2Loss=0.0735 + throughput/total_tokens=2,154,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11223/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=2,154,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11224/500000] + train/ActionNoiseL2Loss=0.0213 + throughput/total_tokens=2,155,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11225/500000] + train/ActionNoiseL2Loss=0.0795 + throughput/total_tokens=2,155,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11226/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,155,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11227/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=2,155,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11228/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=2,155,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11229/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,155,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11230/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=2,156,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11231/500000] + train/ActionNoiseL2Loss=0.0220 + throughput/total_tokens=2,156,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11232/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=2,156,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11233/500000] + train/ActionNoiseL2Loss=0.0586 + throughput/total_tokens=2,156,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11234/500000] + train/ActionNoiseL2Loss=0.0881 + throughput/total_tokens=2,156,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11235/500000] + train/ActionNoiseL2Loss=0.0351 + throughput/total_tokens=2,157,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11236/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=2,157,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11237/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=2,157,504,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11238/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=2,157,696,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11239/500000] + train/ActionNoiseL2Loss=0.0951 + throughput/total_tokens=2,157,888,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11240/500000] + optim/total_grad_norm=0.7952 + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=2,158,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11241/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=2,158,272,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11242/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=2,158,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11243/500000] + train/ActionNoiseL2Loss=0.0701 + throughput/total_tokens=2,158,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11244/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=2,158,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11245/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,159,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11246/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=2,159,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11247/500000] + train/ActionNoiseL2Loss=0.0244 + throughput/total_tokens=2,159,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11248/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=2,159,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11249/500000] + train/ActionNoiseL2Loss=0.0261 + throughput/total_tokens=2,159,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11250/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,160,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11251/500000] + train/ActionNoiseL2Loss=0.0896 + throughput/total_tokens=2,160,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11252/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=2,160,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11253/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=2,160,576,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11254/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,160,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11255/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=2,160,960,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11256/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,161,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11257/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,161,344,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11258/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=2,161,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11259/500000] + train/ActionNoiseL2Loss=0.0794 + throughput/total_tokens=2,161,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11260/500000] + optim/total_grad_norm=0.6097 + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=2,161,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11261/500000] + train/ActionNoiseL2Loss=0.0791 + throughput/total_tokens=2,162,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11262/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=2,162,304,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11263/500000] + train/ActionNoiseL2Loss=0.0434 + throughput/total_tokens=2,162,496,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11264/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=2,162,688,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11265/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,162,880,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=11266/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=2,163,072,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=11267/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,163,264,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=11268/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=2,163,456,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11269/500000] + train/ActionNoiseL2Loss=0.0769 + throughput/total_tokens=2,163,648,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11270/500000] + train/ActionNoiseL2Loss=0.0770 + throughput/total_tokens=2,163,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11271/500000] + train/ActionNoiseL2Loss=0.1159 + throughput/total_tokens=2,164,032,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11272/500000] + train/ActionNoiseL2Loss=0.0741 + throughput/total_tokens=2,164,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11273/500000] + train/ActionNoiseL2Loss=0.0218 + throughput/total_tokens=2,164,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11274/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,164,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11275/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=2,164,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11276/500000] + train/ActionNoiseL2Loss=0.0505 + throughput/total_tokens=2,164,992,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11277/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=2,165,184,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11278/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,165,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11279/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,165,568,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11280/500000] + optim/total_grad_norm=0.6491 + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=2,165,760,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11281/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=2,165,952,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11282/500000] + train/ActionNoiseL2Loss=0.0309 + throughput/total_tokens=2,166,144,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11283/500000] + train/ActionNoiseL2Loss=0.0548 + throughput/total_tokens=2,166,336,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11284/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=2,166,528,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11285/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=2,166,720,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11286/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=2,166,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11287/500000] + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=2,167,104,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11288/500000] + train/ActionNoiseL2Loss=0.0711 + throughput/total_tokens=2,167,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11289/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=2,167,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11290/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=2,167,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11291/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=2,167,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11292/500000] + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=2,168,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11293/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=2,168,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11294/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,168,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11295/500000] + train/ActionNoiseL2Loss=0.0289 + throughput/total_tokens=2,168,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11296/500000] + train/ActionNoiseL2Loss=0.0307 + throughput/total_tokens=2,168,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11297/500000] + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=2,169,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11298/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,169,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11299/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,169,408,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11300/500000] + optim/total_grad_norm=0.5525 + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=2,169,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11301/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=2,169,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11302/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=2,169,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11303/500000] + train/ActionNoiseL2Loss=0.0310 + throughput/total_tokens=2,170,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11304/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=2,170,368,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11305/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,170,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11306/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=2,170,752,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11307/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=2,170,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11308/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=2,171,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11309/500000] + train/ActionNoiseL2Loss=0.0395 + throughput/total_tokens=2,171,328,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11310/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=2,171,520,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11311/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=2,171,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11312/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,171,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11313/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=2,172,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11314/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=2,172,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11315/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=2,172,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11316/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=2,172,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11317/500000] + train/ActionNoiseL2Loss=0.0641 + throughput/total_tokens=2,172,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11318/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=2,173,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11319/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,173,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11320/500000] + optim/total_grad_norm=0.4942 + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,173,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11321/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,173,632,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11322/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=2,173,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11323/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=2,174,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11324/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=2,174,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11325/500000] + train/ActionNoiseL2Loss=0.0579 + throughput/total_tokens=2,174,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11326/500000] + train/ActionNoiseL2Loss=0.0690 + throughput/total_tokens=2,174,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11327/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=2,174,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11328/500000] + train/ActionNoiseL2Loss=0.1112 + throughput/total_tokens=2,174,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11329/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,175,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11330/500000] + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,175,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11331/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=2,175,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11332/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,175,744,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11333/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=2,175,936,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11334/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=2,176,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11335/500000] + train/ActionNoiseL2Loss=0.0537 + throughput/total_tokens=2,176,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11336/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=2,176,512,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11337/500000] + train/ActionNoiseL2Loss=0.0679 + throughput/total_tokens=2,176,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11338/500000] + train/ActionNoiseL2Loss=0.0412 + throughput/total_tokens=2,176,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11339/500000] + train/ActionNoiseL2Loss=0.0291 + throughput/total_tokens=2,177,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11340/500000] + optim/total_grad_norm=0.9661 + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,177,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11341/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=2,177,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11342/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=2,177,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11343/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=2,177,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11344/500000] + train/ActionNoiseL2Loss=0.0430 + throughput/total_tokens=2,178,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11345/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=2,178,240,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11346/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,178,432,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11347/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=2,178,624,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11348/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=2,178,816,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11349/500000] + train/ActionNoiseL2Loss=0.0449 + throughput/total_tokens=2,179,008,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11350/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=2,179,200,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=11351/500000] + train/ActionNoiseL2Loss=0.0819 + throughput/total_tokens=2,179,392,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=11352/500000] + train/ActionNoiseL2Loss=0.0644 + throughput/total_tokens=2,179,584,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=11353/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,179,776,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=11354/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=2,179,968,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=11355/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=2,180,160,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=11356/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,180,352,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=11357/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=2,180,544,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=11358/500000] + train/ActionNoiseL2Loss=0.0178 + throughput/total_tokens=2,180,736,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=11359/500000] + train/ActionNoiseL2Loss=0.0635 + throughput/total_tokens=2,180,928,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=11360/500000] + optim/total_grad_norm=1.164 + train/ActionNoiseL2Loss=0.0861 + throughput/total_tokens=2,181,120,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=11361/500000] + train/ActionNoiseL2Loss=0.0967 + throughput/total_tokens=2,181,312,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=11362/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,181,504,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=11363/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,181,696,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=11364/500000] + train/ActionNoiseL2Loss=0.0559 + throughput/total_tokens=2,181,888,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0476 +[step=11365/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=2,182,080,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11366/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,182,272,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11367/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=2,182,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11368/500000] + train/ActionNoiseL2Loss=0.0288 + throughput/total_tokens=2,182,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11369/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=2,182,848,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11370/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,183,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11371/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=2,183,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11372/500000] + train/ActionNoiseL2Loss=0.0546 + throughput/total_tokens=2,183,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11373/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=2,183,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11374/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=2,183,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11375/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=2,184,000,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11376/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=2,184,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11377/500000] + train/ActionNoiseL2Loss=0.0190 + throughput/total_tokens=2,184,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11378/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,184,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11379/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=2,184,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11380/500000] + optim/total_grad_norm=0.7888 + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,184,960,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11381/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=2,185,152,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11382/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,185,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11383/500000] + train/ActionNoiseL2Loss=0.0305 + throughput/total_tokens=2,185,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11384/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=2,185,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11385/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=2,185,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11386/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,186,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11387/500000] + train/ActionNoiseL2Loss=0.1040 + throughput/total_tokens=2,186,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11388/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=2,186,496,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11389/500000] + train/ActionNoiseL2Loss=0.0716 + throughput/total_tokens=2,186,688,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11390/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=2,186,880,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11391/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=2,187,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11392/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,187,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11393/500000] + train/ActionNoiseL2Loss=0.0696 + throughput/total_tokens=2,187,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11394/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=2,187,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11395/500000] + train/ActionNoiseL2Loss=0.1194 + throughput/total_tokens=2,187,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11396/500000] + train/ActionNoiseL2Loss=0.0372 + throughput/total_tokens=2,188,032,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11397/500000] + train/ActionNoiseL2Loss=0.0264 + throughput/total_tokens=2,188,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11398/500000] + train/ActionNoiseL2Loss=0.0525 + throughput/total_tokens=2,188,416,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11399/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=2,188,608,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11400/500000] + optim/total_grad_norm=0.6577 + train/ActionNoiseL2Loss=0.0682 + throughput/total_tokens=2,188,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11401/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,188,992,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11402/500000] + train/ActionNoiseL2Loss=0.0689 + throughput/total_tokens=2,189,184,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11403/500000] + train/ActionNoiseL2Loss=0.0812 + throughput/total_tokens=2,189,376,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11404/500000] + train/ActionNoiseL2Loss=0.0645 + throughput/total_tokens=2,189,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11405/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=2,189,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11406/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=2,189,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11407/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=2,190,144,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11408/500000] + train/ActionNoiseL2Loss=0.0660 + throughput/total_tokens=2,190,336,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11409/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=2,190,528,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11410/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=2,190,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11411/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=2,190,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11412/500000] + train/ActionNoiseL2Loss=0.0407 + throughput/total_tokens=2,191,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11413/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=2,191,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11414/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,191,488,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11415/500000] + train/ActionNoiseL2Loss=0.0640 + throughput/total_tokens=2,191,680,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11416/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,191,872,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11417/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,192,064,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11418/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=2,192,256,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11419/500000] + train/ActionNoiseL2Loss=0.0367 + throughput/total_tokens=2,192,448,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11420/500000] + optim/total_grad_norm=0.7718 + train/ActionNoiseL2Loss=0.0678 + throughput/total_tokens=2,192,640,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11421/500000] + train/ActionNoiseL2Loss=0.0487 + throughput/total_tokens=2,192,832,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11422/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=2,193,024,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11423/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=2,193,216,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11424/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=2,193,408,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11425/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=2,193,600,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11426/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,193,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11427/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=2,193,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11428/500000] + train/ActionNoiseL2Loss=0.0598 + throughput/total_tokens=2,194,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11429/500000] + train/ActionNoiseL2Loss=0.0669 + throughput/total_tokens=2,194,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11430/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,194,560,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11431/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,194,752,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11432/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,194,944,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11433/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=2,195,136,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11434/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=2,195,328,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11435/500000] + train/ActionNoiseL2Loss=0.0526 + throughput/total_tokens=2,195,520,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11436/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,195,712,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11437/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,195,904,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11438/500000] + train/ActionNoiseL2Loss=0.0777 + throughput/total_tokens=2,196,096,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11439/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,196,288,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11440/500000] + optim/total_grad_norm=0.5449 + train/ActionNoiseL2Loss=0.0616 + throughput/total_tokens=2,196,480,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11441/500000] + train/ActionNoiseL2Loss=0.0655 + throughput/total_tokens=2,196,672,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11442/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,196,864,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11443/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=2,197,056,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11444/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=2,197,248,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11445/500000] + train/ActionNoiseL2Loss=0.0451 + throughput/total_tokens=2,197,440,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11446/500000] + train/ActionNoiseL2Loss=0.0318 + throughput/total_tokens=2,197,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11447/500000] + train/ActionNoiseL2Loss=0.0479 + throughput/total_tokens=2,197,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11448/500000] + train/ActionNoiseL2Loss=0.0404 + throughput/total_tokens=2,198,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11449/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=2,198,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11450/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=2,198,400,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11451/500000] + train/ActionNoiseL2Loss=0.0704 + throughput/total_tokens=2,198,592,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11452/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,198,784,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11453/500000] + train/ActionNoiseL2Loss=0.0628 + throughput/total_tokens=2,198,976,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11454/500000] + train/ActionNoiseL2Loss=0.0365 + throughput/total_tokens=2,199,168,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11455/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=2,199,360,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11456/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,199,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11457/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,199,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11458/500000] + train/ActionNoiseL2Loss=0.0852 + throughput/total_tokens=2,199,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11459/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=2,200,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11460/500000] + optim/total_grad_norm=0.7757 + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,200,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11461/500000] + train/ActionNoiseL2Loss=0.0591 + throughput/total_tokens=2,200,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11462/500000] + train/ActionNoiseL2Loss=0.0520 + throughput/total_tokens=2,200,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11463/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=2,200,896,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11464/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,201,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11465/500000] + train/ActionNoiseL2Loss=0.1139 + throughput/total_tokens=2,201,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11466/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,201,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11467/500000] + train/ActionNoiseL2Loss=0.0254 + throughput/total_tokens=2,201,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11468/500000] + train/ActionNoiseL2Loss=0.0321 + throughput/total_tokens=2,201,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11469/500000] + train/ActionNoiseL2Loss=0.0642 + throughput/total_tokens=2,202,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11470/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=2,202,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11471/500000] + train/ActionNoiseL2Loss=0.0504 + throughput/total_tokens=2,202,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11472/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,202,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11473/500000] + train/ActionNoiseL2Loss=0.0572 + throughput/total_tokens=2,202,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11474/500000] + train/ActionNoiseL2Loss=0.0714 + throughput/total_tokens=2,203,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11475/500000] + train/ActionNoiseL2Loss=0.0681 + throughput/total_tokens=2,203,200,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11476/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=2,203,392,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11477/500000] + train/ActionNoiseL2Loss=0.0531 + throughput/total_tokens=2,203,584,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11478/500000] + train/ActionNoiseL2Loss=0.0599 + throughput/total_tokens=2,203,776,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11479/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=2,203,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11480/500000] + optim/total_grad_norm=0.6921 + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,204,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11481/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,204,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11482/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=2,204,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11483/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=2,204,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11484/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,204,928,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11485/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=2,205,120,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11486/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=2,205,312,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11487/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=2,205,504,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11488/500000] + train/ActionNoiseL2Loss=0.0626 + throughput/total_tokens=2,205,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11489/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=2,205,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11490/500000] + train/ActionNoiseL2Loss=0.0854 + throughput/total_tokens=2,206,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11491/500000] + train/ActionNoiseL2Loss=0.0556 + throughput/total_tokens=2,206,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11492/500000] + train/ActionNoiseL2Loss=0.1011 + throughput/total_tokens=2,206,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11493/500000] + train/ActionNoiseL2Loss=0.0684 + throughput/total_tokens=2,206,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11494/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=2,206,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11495/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=2,207,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11496/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=2,207,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11497/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=2,207,424,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11498/500000] + train/ActionNoiseL2Loss=0.0803 + throughput/total_tokens=2,207,616,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11499/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=2,207,808,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11500/500000] + optim/total_grad_norm=0.8442 + train/ActionNoiseL2Loss=0.0665 + throughput/total_tokens=2,208,000,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +10/14 [13:16:01] INFO | >> Saving config... checkpoint.py:608 +10/14 [13:16:35] INFO | >> Saving model state... checkpoint.py:796 +10/14 [13:17:49] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [13:19:31] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=11501/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,208,192,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=11502/500000] + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=2,208,384,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=11503/500000] + train/ActionNoiseL2Loss=0.0508 + throughput/total_tokens=2,208,576,000 + throughput/device/tokens_per_second=1,134 + throughput/device/batches_per_second=0.0473 +[step=11504/500000] + train/ActionNoiseL2Loss=0.0455 + throughput/total_tokens=2,208,768,000 + throughput/device/tokens_per_second=1,136 + throughput/device/batches_per_second=0.0474 +[step=11505/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=2,208,960,000 + throughput/device/tokens_per_second=1,139 + throughput/device/batches_per_second=0.0475 +[step=11506/500000] + train/ActionNoiseL2Loss=0.0917 + throughput/total_tokens=2,209,152,000 + throughput/device/tokens_per_second=1,141 + throughput/device/batches_per_second=0.0476 +[step=11507/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=2,209,344,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=11508/500000] + train/ActionNoiseL2Loss=0.0924 + throughput/total_tokens=2,209,536,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11509/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,209,728,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11510/500000] + train/ActionNoiseL2Loss=0.0363 + throughput/total_tokens=2,209,920,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=11511/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=2,210,112,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11512/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=2,210,304,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11513/500000] + train/ActionNoiseL2Loss=0.0379 + throughput/total_tokens=2,210,496,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11514/500000] + train/ActionNoiseL2Loss=0.0436 + throughput/total_tokens=2,210,688,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11515/500000] + train/ActionNoiseL2Loss=0.0425 + throughput/total_tokens=2,210,880,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11516/500000] + train/ActionNoiseL2Loss=0.0274 + throughput/total_tokens=2,211,072,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11517/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=2,211,264,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11518/500000] + train/ActionNoiseL2Loss=0.0943 + throughput/total_tokens=2,211,456,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11519/500000] + train/ActionNoiseL2Loss=0.0614 + throughput/total_tokens=2,211,648,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11520/500000] + optim/total_grad_norm=0.7911 + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=2,211,840,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=11521/500000] + train/ActionNoiseL2Loss=0.0686 + throughput/total_tokens=2,212,032,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11522/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,212,224,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11523/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,212,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11524/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=2,212,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11525/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=2,212,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11526/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=2,212,992,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11527/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,213,184,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11528/500000] + train/ActionNoiseL2Loss=0.0652 + throughput/total_tokens=2,213,376,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11529/500000] + train/ActionNoiseL2Loss=0.0438 + throughput/total_tokens=2,213,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11530/500000] + train/ActionNoiseL2Loss=0.0839 + throughput/total_tokens=2,213,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11531/500000] + train/ActionNoiseL2Loss=0.0445 + throughput/total_tokens=2,213,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11532/500000] + train/ActionNoiseL2Loss=0.0254 + throughput/total_tokens=2,214,144,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11533/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=2,214,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11534/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=2,214,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11535/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=2,214,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11536/500000] + train/ActionNoiseL2Loss=0.0330 + throughput/total_tokens=2,214,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11537/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=2,215,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11538/500000] + train/ActionNoiseL2Loss=0.0646 + throughput/total_tokens=2,215,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11539/500000] + train/ActionNoiseL2Loss=0.0623 + throughput/total_tokens=2,215,488,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11540/500000] + optim/total_grad_norm=0.5279 + train/ActionNoiseL2Loss=0.0524 + throughput/total_tokens=2,215,680,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11541/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,215,872,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11542/500000] + train/ActionNoiseL2Loss=0.0256 + throughput/total_tokens=2,216,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11543/500000] + train/ActionNoiseL2Loss=0.0343 + throughput/total_tokens=2,216,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11544/500000] + train/ActionNoiseL2Loss=0.0960 + throughput/total_tokens=2,216,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11545/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,216,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11546/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=2,216,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11547/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=2,217,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11548/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=2,217,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11549/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=2,217,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11550/500000] + train/ActionNoiseL2Loss=0.0348 + throughput/total_tokens=2,217,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11551/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=2,217,792,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11552/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=2,217,984,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11553/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=2,218,176,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11554/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=2,218,368,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11555/500000] + train/ActionNoiseL2Loss=0.0300 + throughput/total_tokens=2,218,560,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11556/500000] + train/ActionNoiseL2Loss=0.0333 + throughput/total_tokens=2,218,752,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11557/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,218,944,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11558/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=2,219,136,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11559/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,219,328,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11560/500000] + optim/total_grad_norm=0.7126 + train/ActionNoiseL2Loss=0.0435 + throughput/total_tokens=2,219,520,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=11561/500000] + train/ActionNoiseL2Loss=0.0581 + throughput/total_tokens=2,219,712,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11562/500000] + train/ActionNoiseL2Loss=0.0774 + throughput/total_tokens=2,219,904,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11563/500000] + train/ActionNoiseL2Loss=0.0804 + throughput/total_tokens=2,220,096,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11564/500000] + train/ActionNoiseL2Loss=0.0263 + throughput/total_tokens=2,220,288,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11565/500000] + train/ActionNoiseL2Loss=0.0573 + throughput/total_tokens=2,220,480,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11566/500000] + train/ActionNoiseL2Loss=0.0995 + throughput/total_tokens=2,220,672,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11567/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=2,220,864,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11568/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=2,221,056,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11569/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=2,221,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11570/500000] + train/ActionNoiseL2Loss=0.0452 + throughput/total_tokens=2,221,440,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11571/500000] + train/ActionNoiseL2Loss=0.0398 + throughput/total_tokens=2,221,632,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11572/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=2,221,824,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11573/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,222,016,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11574/500000] + train/ActionNoiseL2Loss=0.0297 + throughput/total_tokens=2,222,208,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11575/500000] + train/ActionNoiseL2Loss=0.0969 + throughput/total_tokens=2,222,400,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11576/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,222,592,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11577/500000] + train/ActionNoiseL2Loss=0.0303 + throughput/total_tokens=2,222,784,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11578/500000] + train/ActionNoiseL2Loss=0.0687 + throughput/total_tokens=2,222,976,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11579/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,223,168,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11580/500000] + optim/total_grad_norm=0.8734 + train/ActionNoiseL2Loss=0.0273 + throughput/total_tokens=2,223,360,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11581/500000] + train/ActionNoiseL2Loss=0.0670 + throughput/total_tokens=2,223,552,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11582/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=2,223,744,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11583/500000] + train/ActionNoiseL2Loss=0.0882 + throughput/total_tokens=2,223,936,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11584/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=2,224,128,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11585/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=2,224,320,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11586/500000] + train/ActionNoiseL2Loss=0.0602 + throughput/total_tokens=2,224,512,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11587/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=2,224,704,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11588/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,224,896,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11589/500000] + train/ActionNoiseL2Loss=0.0248 + throughput/total_tokens=2,225,088,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11590/500000] + train/ActionNoiseL2Loss=0.0920 + throughput/total_tokens=2,225,280,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11591/500000] + train/ActionNoiseL2Loss=0.0391 + throughput/total_tokens=2,225,472,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11592/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,225,664,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11593/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=2,225,856,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11594/500000] + train/ActionNoiseL2Loss=0.0595 + throughput/total_tokens=2,226,048,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11595/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=2,226,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11596/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=2,226,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11597/500000] + train/ActionNoiseL2Loss=0.0255 + throughput/total_tokens=2,226,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11598/500000] + train/ActionNoiseL2Loss=0.1325 + throughput/total_tokens=2,226,816,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11599/500000] + train/ActionNoiseL2Loss=0.0662 + throughput/total_tokens=2,227,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11600/500000] + optim/total_grad_norm=0.9487 + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=2,227,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11601/500000] + train/ActionNoiseL2Loss=0.0632 + throughput/total_tokens=2,227,392,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11602/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=2,227,584,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11603/500000] + train/ActionNoiseL2Loss=0.0907 + throughput/total_tokens=2,227,776,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11604/500000] + train/ActionNoiseL2Loss=0.0606 + throughput/total_tokens=2,227,968,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11605/500000] + train/ActionNoiseL2Loss=0.0275 + throughput/total_tokens=2,228,160,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11606/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=2,228,352,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11607/500000] + train/ActionNoiseL2Loss=0.0275 + throughput/total_tokens=2,228,544,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11608/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=2,228,736,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11609/500000] + train/ActionNoiseL2Loss=0.0349 + throughput/total_tokens=2,228,928,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11610/500000] + train/ActionNoiseL2Loss=0.0680 + throughput/total_tokens=2,229,120,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=11611/500000] + train/ActionNoiseL2Loss=0.0637 + throughput/total_tokens=2,229,312,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11612/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,229,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11613/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=2,229,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11614/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,229,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11615/500000] + train/ActionNoiseL2Loss=0.0974 + throughput/total_tokens=2,230,080,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11616/500000] + train/ActionNoiseL2Loss=0.0585 + throughput/total_tokens=2,230,272,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11617/500000] + train/ActionNoiseL2Loss=0.0958 + throughput/total_tokens=2,230,464,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11618/500000] + train/ActionNoiseL2Loss=0.0345 + throughput/total_tokens=2,230,656,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11619/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=2,230,848,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11620/500000] + optim/total_grad_norm=0.5555 + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=2,231,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11621/500000] + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=2,231,232,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11622/500000] + train/ActionNoiseL2Loss=0.0242 + throughput/total_tokens=2,231,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11623/500000] + train/ActionNoiseL2Loss=0.0422 + throughput/total_tokens=2,231,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11624/500000] + train/ActionNoiseL2Loss=0.0654 + throughput/total_tokens=2,231,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11625/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=2,232,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11626/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=2,232,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11627/500000] + train/ActionNoiseL2Loss=0.0502 + throughput/total_tokens=2,232,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11628/500000] + train/ActionNoiseL2Loss=0.0514 + throughput/total_tokens=2,232,576,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11629/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,232,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11630/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=2,232,960,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11631/500000] + train/ActionNoiseL2Loss=0.0401 + throughput/total_tokens=2,233,152,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11632/500000] + train/ActionNoiseL2Loss=0.0805 + throughput/total_tokens=2,233,344,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11633/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=2,233,536,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11634/500000] + train/ActionNoiseL2Loss=0.0737 + throughput/total_tokens=2,233,728,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11635/500000] + train/ActionNoiseL2Loss=0.0371 + throughput/total_tokens=2,233,920,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11636/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,234,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11637/500000] + train/ActionNoiseL2Loss=0.0323 + throughput/total_tokens=2,234,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11638/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,234,496,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11639/500000] + train/ActionNoiseL2Loss=0.1083 + throughput/total_tokens=2,234,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11640/500000] + optim/total_grad_norm=0.8047 + train/ActionNoiseL2Loss=0.0844 + throughput/total_tokens=2,234,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11641/500000] + train/ActionNoiseL2Loss=0.0549 + throughput/total_tokens=2,235,072,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11642/500000] + train/ActionNoiseL2Loss=0.0499 + throughput/total_tokens=2,235,264,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11643/500000] + train/ActionNoiseL2Loss=0.0786 + throughput/total_tokens=2,235,456,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11644/500000] + train/ActionNoiseL2Loss=0.0344 + throughput/total_tokens=2,235,648,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11645/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=2,235,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11646/500000] + train/ActionNoiseL2Loss=0.0251 + throughput/total_tokens=2,236,032,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11647/500000] + train/ActionNoiseL2Loss=0.0261 + throughput/total_tokens=2,236,224,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11648/500000] + train/ActionNoiseL2Loss=0.0793 + throughput/total_tokens=2,236,416,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11649/500000] + train/ActionNoiseL2Loss=0.1175 + throughput/total_tokens=2,236,608,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11650/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=2,236,800,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11651/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=2,236,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11652/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,237,184,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11653/500000] + train/ActionNoiseL2Loss=0.0589 + throughput/total_tokens=2,237,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11654/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,237,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11655/500000] + train/ActionNoiseL2Loss=0.0719 + throughput/total_tokens=2,237,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11656/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,237,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11657/500000] + train/ActionNoiseL2Loss=0.0855 + throughput/total_tokens=2,238,144,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11658/500000] + train/ActionNoiseL2Loss=0.0378 + throughput/total_tokens=2,238,336,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11659/500000] + train/ActionNoiseL2Loss=0.0292 + throughput/total_tokens=2,238,528,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11660/500000] + optim/total_grad_norm=0.9711 + train/ActionNoiseL2Loss=0.1056 + throughput/total_tokens=2,238,720,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=11661/500000] + train/ActionNoiseL2Loss=0.0885 + throughput/total_tokens=2,238,912,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11662/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=2,239,104,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11663/500000] + train/ActionNoiseL2Loss=0.0561 + throughput/total_tokens=2,239,296,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11664/500000] + train/ActionNoiseL2Loss=0.0697 + throughput/total_tokens=2,239,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11665/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=2,239,680,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11666/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=2,239,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11667/500000] + train/ActionNoiseL2Loss=0.0554 + throughput/total_tokens=2,240,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11668/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,240,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11669/500000] + train/ActionNoiseL2Loss=0.0597 + throughput/total_tokens=2,240,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11670/500000] + train/ActionNoiseL2Loss=0.0895 + throughput/total_tokens=2,240,640,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11671/500000] + train/ActionNoiseL2Loss=0.0373 + throughput/total_tokens=2,240,832,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11672/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,241,024,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11673/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=2,241,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11674/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,241,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11675/500000] + train/ActionNoiseL2Loss=0.0496 + throughput/total_tokens=2,241,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11676/500000] + train/ActionNoiseL2Loss=0.0186 + throughput/total_tokens=2,241,792,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11677/500000] + train/ActionNoiseL2Loss=0.0649 + throughput/total_tokens=2,241,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11678/500000] + train/ActionNoiseL2Loss=0.0544 + throughput/total_tokens=2,242,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11679/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,242,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11680/500000] + optim/total_grad_norm=0.5772 + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=2,242,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11681/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=2,242,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11682/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=2,242,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11683/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,243,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11684/500000] + train/ActionNoiseL2Loss=0.0513 + throughput/total_tokens=2,243,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11685/500000] + train/ActionNoiseL2Loss=0.0750 + throughput/total_tokens=2,243,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11686/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,243,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11687/500000] + train/ActionNoiseL2Loss=0.0604 + throughput/total_tokens=2,243,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11688/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=2,244,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11689/500000] + train/ActionNoiseL2Loss=0.0515 + throughput/total_tokens=2,244,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11690/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=2,244,480,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11691/500000] + train/ActionNoiseL2Loss=0.0775 + throughput/total_tokens=2,244,672,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11692/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=2,244,864,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11693/500000] + train/ActionNoiseL2Loss=0.0533 + throughput/total_tokens=2,245,056,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11694/500000] + train/ActionNoiseL2Loss=0.0698 + throughput/total_tokens=2,245,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11695/500000] + train/ActionNoiseL2Loss=0.0477 + throughput/total_tokens=2,245,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11696/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=2,245,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11697/500000] + train/ActionNoiseL2Loss=0.0400 + throughput/total_tokens=2,245,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11698/500000] + train/ActionNoiseL2Loss=0.0723 + throughput/total_tokens=2,246,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11699/500000] + train/ActionNoiseL2Loss=0.0466 + throughput/total_tokens=2,246,208,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11700/500000] + optim/total_grad_norm=0.7707 + train/ActionNoiseL2Loss=0.0987 + throughput/total_tokens=2,246,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11701/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=2,246,592,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11702/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=2,246,784,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11703/500000] + train/ActionNoiseL2Loss=0.0260 + throughput/total_tokens=2,246,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11704/500000] + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,247,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11705/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=2,247,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11706/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=2,247,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11707/500000] + train/ActionNoiseL2Loss=0.0250 + throughput/total_tokens=2,247,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11708/500000] + train/ActionNoiseL2Loss=0.0592 + throughput/total_tokens=2,247,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11709/500000] + train/ActionNoiseL2Loss=0.0578 + throughput/total_tokens=2,248,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11710/500000] + train/ActionNoiseL2Loss=0.1134 + throughput/total_tokens=2,248,320,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11711/500000] + train/ActionNoiseL2Loss=0.0492 + throughput/total_tokens=2,248,512,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11712/500000] + train/ActionNoiseL2Loss=0.0853 + throughput/total_tokens=2,248,704,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11713/500000] + train/ActionNoiseL2Loss=0.0262 + throughput/total_tokens=2,248,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11714/500000] + train/ActionNoiseL2Loss=0.0944 + throughput/total_tokens=2,249,088,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11715/500000] + train/ActionNoiseL2Loss=0.0414 + throughput/total_tokens=2,249,280,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11716/500000] + train/ActionNoiseL2Loss=0.0134 + throughput/total_tokens=2,249,472,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11717/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,249,664,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11718/500000] + train/ActionNoiseL2Loss=0.0577 + throughput/total_tokens=2,249,856,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11719/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,250,048,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11720/500000] + optim/total_grad_norm=0.7022 + train/ActionNoiseL2Loss=0.0734 + throughput/total_tokens=2,250,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11721/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=2,250,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11722/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,250,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11723/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=2,250,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11724/500000] + train/ActionNoiseL2Loss=0.0762 + throughput/total_tokens=2,251,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11725/500000] + train/ActionNoiseL2Loss=0.0381 + throughput/total_tokens=2,251,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11726/500000] + train/ActionNoiseL2Loss=0.0728 + throughput/total_tokens=2,251,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11727/500000] + train/ActionNoiseL2Loss=0.0383 + throughput/total_tokens=2,251,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11728/500000] + train/ActionNoiseL2Loss=0.0266 + throughput/total_tokens=2,251,776,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11729/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=2,251,968,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11730/500000] + train/ActionNoiseL2Loss=0.0317 + throughput/total_tokens=2,252,160,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11731/500000] + train/ActionNoiseL2Loss=0.0594 + throughput/total_tokens=2,252,352,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11732/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,252,544,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11733/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=2,252,736,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11734/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=2,252,928,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11735/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=2,253,120,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11736/500000] + train/ActionNoiseL2Loss=0.0489 + throughput/total_tokens=2,253,312,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11737/500000] + train/ActionNoiseL2Loss=0.0403 + throughput/total_tokens=2,253,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11738/500000] + train/ActionNoiseL2Loss=0.0651 + throughput/total_tokens=2,253,696,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11739/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=2,253,888,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11740/500000] + optim/total_grad_norm=0.4144 + train/ActionNoiseL2Loss=0.0336 + throughput/total_tokens=2,254,080,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11741/500000] + train/ActionNoiseL2Loss=0.0503 + throughput/total_tokens=2,254,272,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11742/500000] + train/ActionNoiseL2Loss=0.0376 + throughput/total_tokens=2,254,464,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11743/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=2,254,656,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11744/500000] + train/ActionNoiseL2Loss=0.0364 + throughput/total_tokens=2,254,848,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11745/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=2,255,040,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11746/500000] + train/ActionNoiseL2Loss=0.0390 + throughput/total_tokens=2,255,232,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11747/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=2,255,424,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11748/500000] + train/ActionNoiseL2Loss=0.0661 + throughput/total_tokens=2,255,616,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11749/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=2,255,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11750/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=2,256,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11751/500000] + train/ActionNoiseL2Loss=0.0304 + throughput/total_tokens=2,256,192,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11752/500000] + train/ActionNoiseL2Loss=0.0552 + throughput/total_tokens=2,256,384,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11753/500000] + train/ActionNoiseL2Loss=0.0580 + throughput/total_tokens=2,256,576,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11754/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=2,256,768,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11755/500000] + train/ActionNoiseL2Loss=0.0347 + throughput/total_tokens=2,256,960,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11756/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,257,152,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11757/500000] + train/ActionNoiseL2Loss=0.0439 + throughput/total_tokens=2,257,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11758/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=2,257,536,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11759/500000] + train/ActionNoiseL2Loss=0.0290 + throughput/total_tokens=2,257,728,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11760/500000] + optim/total_grad_norm=0.6299 + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=2,257,920,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11761/500000] + train/ActionNoiseL2Loss=0.0954 + throughput/total_tokens=2,258,112,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11762/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=2,258,304,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11763/500000] + train/ActionNoiseL2Loss=0.0408 + throughput/total_tokens=2,258,496,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11764/500000] + train/ActionNoiseL2Loss=0.0454 + throughput/total_tokens=2,258,688,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11765/500000] + train/ActionNoiseL2Loss=0.0208 + throughput/total_tokens=2,258,880,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11766/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=2,259,072,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11767/500000] + train/ActionNoiseL2Loss=0.0447 + throughput/total_tokens=2,259,264,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11768/500000] + train/ActionNoiseL2Loss=0.0529 + throughput/total_tokens=2,259,456,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11769/500000] + train/ActionNoiseL2Loss=0.0612 + throughput/total_tokens=2,259,648,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11770/500000] + train/ActionNoiseL2Loss=0.0375 + throughput/total_tokens=2,259,840,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11771/500000] + train/ActionNoiseL2Loss=0.0938 + throughput/total_tokens=2,260,032,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11772/500000] + train/ActionNoiseL2Loss=0.0469 + throughput/total_tokens=2,260,224,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11773/500000] + train/ActionNoiseL2Loss=0.0636 + throughput/total_tokens=2,260,416,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11774/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=2,260,608,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11775/500000] + train/ActionNoiseL2Loss=0.0388 + throughput/total_tokens=2,260,800,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11776/500000] + train/ActionNoiseL2Loss=0.0473 + throughput/total_tokens=2,260,992,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11777/500000] + train/ActionNoiseL2Loss=0.1091 + throughput/total_tokens=2,261,184,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11778/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=2,261,376,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11779/500000] + train/ActionNoiseL2Loss=0.0429 + throughput/total_tokens=2,261,568,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11780/500000] + optim/total_grad_norm=0.8650 + train/ActionNoiseL2Loss=0.0493 + throughput/total_tokens=2,261,760,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11781/500000] + train/ActionNoiseL2Loss=0.0708 + throughput/total_tokens=2,261,952,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11782/500000] + train/ActionNoiseL2Loss=0.0374 + throughput/total_tokens=2,262,144,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11783/500000] + train/ActionNoiseL2Loss=0.0332 + throughput/total_tokens=2,262,336,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11784/500000] + train/ActionNoiseL2Loss=0.0245 + throughput/total_tokens=2,262,528,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11785/500000] + train/ActionNoiseL2Loss=0.1107 + throughput/total_tokens=2,262,720,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11786/500000] + train/ActionNoiseL2Loss=0.0528 + throughput/total_tokens=2,262,912,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11787/500000] + train/ActionNoiseL2Loss=0.0848 + throughput/total_tokens=2,263,104,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11788/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=2,263,296,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11789/500000] + train/ActionNoiseL2Loss=0.0484 + throughput/total_tokens=2,263,488,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11790/500000] + train/ActionNoiseL2Loss=0.1034 + throughput/total_tokens=2,263,680,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11791/500000] + train/ActionNoiseL2Loss=0.0510 + throughput/total_tokens=2,263,872,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11792/500000] + train/ActionNoiseL2Loss=0.0613 + throughput/total_tokens=2,264,064,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11793/500000] + train/ActionNoiseL2Loss=0.0633 + throughput/total_tokens=2,264,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11794/500000] + train/ActionNoiseL2Loss=0.0380 + throughput/total_tokens=2,264,448,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11795/500000] + train/ActionNoiseL2Loss=0.1061 + throughput/total_tokens=2,264,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11796/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,264,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11797/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=2,265,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11798/500000] + train/ActionNoiseL2Loss=0.0536 + throughput/total_tokens=2,265,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11799/500000] + train/ActionNoiseL2Loss=0.0460 + throughput/total_tokens=2,265,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11800/500000] + optim/total_grad_norm=0.7516 + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,265,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11801/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,265,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11802/500000] + train/ActionNoiseL2Loss=0.0507 + throughput/total_tokens=2,265,984,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11803/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=2,266,176,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11804/500000] + train/ActionNoiseL2Loss=0.0456 + throughput/total_tokens=2,266,368,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11805/500000] + train/ActionNoiseL2Loss=0.0382 + throughput/total_tokens=2,266,560,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11806/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,266,752,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11807/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=2,266,944,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11808/500000] + train/ActionNoiseL2Loss=0.0575 + throughput/total_tokens=2,267,136,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11809/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=2,267,328,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=11810/500000] + train/ActionNoiseL2Loss=0.0485 + throughput/total_tokens=2,267,520,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11811/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=2,267,712,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11812/500000] + train/ActionNoiseL2Loss=0.0482 + throughput/total_tokens=2,267,904,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11813/500000] + train/ActionNoiseL2Loss=0.1161 + throughput/total_tokens=2,268,096,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11814/500000] + train/ActionNoiseL2Loss=0.0441 + throughput/total_tokens=2,268,288,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11815/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=2,268,480,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11816/500000] + train/ActionNoiseL2Loss=0.0495 + throughput/total_tokens=2,268,672,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11817/500000] + train/ActionNoiseL2Loss=0.1043 + throughput/total_tokens=2,268,864,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11818/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,269,056,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11819/500000] + train/ActionNoiseL2Loss=0.0280 + throughput/total_tokens=2,269,248,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11820/500000] + optim/total_grad_norm=0.8780 + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,269,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11821/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=2,269,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11822/500000] + train/ActionNoiseL2Loss=0.0350 + throughput/total_tokens=2,269,824,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11823/500000] + train/ActionNoiseL2Loss=0.0535 + throughput/total_tokens=2,270,016,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11824/500000] + train/ActionNoiseL2Loss=0.0713 + throughput/total_tokens=2,270,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11825/500000] + train/ActionNoiseL2Loss=0.0462 + throughput/total_tokens=2,270,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11826/500000] + train/ActionNoiseL2Loss=0.0742 + throughput/total_tokens=2,270,592,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11827/500000] + train/ActionNoiseL2Loss=0.0543 + throughput/total_tokens=2,270,784,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11828/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,270,976,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11829/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=2,271,168,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11830/500000] + train/ActionNoiseL2Loss=0.0356 + throughput/total_tokens=2,271,360,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11831/500000] + train/ActionNoiseL2Loss=0.0424 + throughput/total_tokens=2,271,552,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11832/500000] + train/ActionNoiseL2Loss=0.0754 + throughput/total_tokens=2,271,744,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11833/500000] + train/ActionNoiseL2Loss=0.0553 + throughput/total_tokens=2,271,936,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11834/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=2,272,128,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11835/500000] + train/ActionNoiseL2Loss=0.0810 + throughput/total_tokens=2,272,320,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11836/500000] + train/ActionNoiseL2Loss=0.0676 + throughput/total_tokens=2,272,512,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11837/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=2,272,704,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11838/500000] + train/ActionNoiseL2Loss=0.0428 + throughput/total_tokens=2,272,896,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11839/500000] + train/ActionNoiseL2Loss=0.0630 + throughput/total_tokens=2,273,088,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11840/500000] + optim/total_grad_norm=0.7621 + train/ActionNoiseL2Loss=0.0782 + throughput/total_tokens=2,273,280,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11841/500000] + train/ActionNoiseL2Loss=0.0830 + throughput/total_tokens=2,273,472,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11842/500000] + train/ActionNoiseL2Loss=0.0331 + throughput/total_tokens=2,273,664,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11843/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=2,273,856,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11844/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,274,048,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11845/500000] + train/ActionNoiseL2Loss=0.0521 + throughput/total_tokens=2,274,240,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11846/500000] + train/ActionNoiseL2Loss=0.1096 + throughput/total_tokens=2,274,432,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11847/500000] + train/ActionNoiseL2Loss=0.0420 + throughput/total_tokens=2,274,624,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11848/500000] + train/ActionNoiseL2Loss=0.0596 + throughput/total_tokens=2,274,816,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11849/500000] + train/ActionNoiseL2Loss=0.0431 + throughput/total_tokens=2,275,008,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11850/500000] + train/ActionNoiseL2Loss=0.0653 + throughput/total_tokens=2,275,200,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11851/500000] + train/ActionNoiseL2Loss=0.0352 + throughput/total_tokens=2,275,392,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11852/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,275,584,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11853/500000] + train/ActionNoiseL2Loss=0.0368 + throughput/total_tokens=2,275,776,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11854/500000] + train/ActionNoiseL2Loss=0.0291 + throughput/total_tokens=2,275,968,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11855/500000] + train/ActionNoiseL2Loss=0.0329 + throughput/total_tokens=2,276,160,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11856/500000] + train/ActionNoiseL2Loss=0.0673 + throughput/total_tokens=2,276,352,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11857/500000] + train/ActionNoiseL2Loss=0.0622 + throughput/total_tokens=2,276,544,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11858/500000] + train/ActionNoiseL2Loss=0.0272 + throughput/total_tokens=2,276,736,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11859/500000] + train/ActionNoiseL2Loss=0.0416 + throughput/total_tokens=2,276,928,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11860/500000] + optim/total_grad_norm=0.7575 + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,277,120,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=11861/500000] + train/ActionNoiseL2Loss=0.0475 + throughput/total_tokens=2,277,312,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11862/500000] + train/ActionNoiseL2Loss=0.1004 + throughput/total_tokens=2,277,504,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11863/500000] + train/ActionNoiseL2Loss=0.0817 + throughput/total_tokens=2,277,696,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11864/500000] + train/ActionNoiseL2Loss=0.1321 + throughput/total_tokens=2,277,888,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11865/500000] + train/ActionNoiseL2Loss=0.0634 + throughput/total_tokens=2,278,080,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11866/500000] + train/ActionNoiseL2Loss=0.0564 + throughput/total_tokens=2,278,272,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11867/500000] + train/ActionNoiseL2Loss=0.0478 + throughput/total_tokens=2,278,464,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11868/500000] + train/ActionNoiseL2Loss=0.0667 + throughput/total_tokens=2,278,656,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11869/500000] + train/ActionNoiseL2Loss=0.0320 + throughput/total_tokens=2,278,848,000 + throughput/device/tokens_per_second=1,144 + throughput/device/batches_per_second=0.0477 +[step=11870/500000] + train/ActionNoiseL2Loss=0.0771 + throughput/total_tokens=2,279,040,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11871/500000] + train/ActionNoiseL2Loss=0.0311 + throughput/total_tokens=2,279,232,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11872/500000] + train/ActionNoiseL2Loss=0.0799 + throughput/total_tokens=2,279,424,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11873/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=2,279,616,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=11874/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=2,279,808,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11875/500000] + train/ActionNoiseL2Loss=0.0816 + throughput/total_tokens=2,280,000,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11876/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=2,280,192,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11877/500000] + train/ActionNoiseL2Loss=0.0729 + throughput/total_tokens=2,280,384,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11878/500000] + train/ActionNoiseL2Loss=0.0797 + throughput/total_tokens=2,280,576,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11879/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=2,280,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11880/500000] + optim/total_grad_norm=0.6628 + train/ActionNoiseL2Loss=0.0624 + throughput/total_tokens=2,280,960,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11881/500000] + train/ActionNoiseL2Loss=0.0342 + throughput/total_tokens=2,281,152,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11882/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,281,344,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11883/500000] + train/ActionNoiseL2Loss=0.0530 + throughput/total_tokens=2,281,536,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11884/500000] + train/ActionNoiseL2Loss=0.0829 + throughput/total_tokens=2,281,728,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11885/500000] + train/ActionNoiseL2Loss=0.0480 + throughput/total_tokens=2,281,920,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11886/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=2,282,112,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11887/500000] + train/ActionNoiseL2Loss=0.0282 + throughput/total_tokens=2,282,304,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11888/500000] + train/ActionNoiseL2Loss=0.0498 + throughput/total_tokens=2,282,496,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11889/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=2,282,688,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11890/500000] + train/ActionNoiseL2Loss=0.0899 + throughput/total_tokens=2,282,880,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11891/500000] + train/ActionNoiseL2Loss=0.0567 + throughput/total_tokens=2,283,072,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11892/500000] + train/ActionNoiseL2Loss=0.0453 + throughput/total_tokens=2,283,264,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11893/500000] + train/ActionNoiseL2Loss=0.1110 + throughput/total_tokens=2,283,456,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11894/500000] + train/ActionNoiseL2Loss=0.0361 + throughput/total_tokens=2,283,648,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11895/500000] + train/ActionNoiseL2Loss=0.0826 + throughput/total_tokens=2,283,840,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11896/500000] + train/ActionNoiseL2Loss=0.0116 + throughput/total_tokens=2,284,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11897/500000] + train/ActionNoiseL2Loss=0.0934 + throughput/total_tokens=2,284,224,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11898/500000] + train/ActionNoiseL2Loss=0.0639 + throughput/total_tokens=2,284,416,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11899/500000] + train/ActionNoiseL2Loss=0.0468 + throughput/total_tokens=2,284,608,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11900/500000] + optim/total_grad_norm=0.8190 + train/ActionNoiseL2Loss=0.0783 + throughput/total_tokens=2,284,800,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11901/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=2,284,992,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11902/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=2,285,184,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11903/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=2,285,376,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11904/500000] + train/ActionNoiseL2Loss=0.0574 + throughput/total_tokens=2,285,568,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11905/500000] + train/ActionNoiseL2Loss=0.0178 + throughput/total_tokens=2,285,760,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11906/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=2,285,952,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11907/500000] + train/ActionNoiseL2Loss=0.0566 + throughput/total_tokens=2,286,144,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11908/500000] + train/ActionNoiseL2Loss=0.0916 + throughput/total_tokens=2,286,336,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11909/500000] + train/ActionNoiseL2Loss=0.0784 + throughput/total_tokens=2,286,528,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11910/500000] + train/ActionNoiseL2Loss=0.0672 + throughput/total_tokens=2,286,720,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=11911/500000] + train/ActionNoiseL2Loss=0.0691 + throughput/total_tokens=2,286,912,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11912/500000] + train/ActionNoiseL2Loss=0.0442 + throughput/total_tokens=2,287,104,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11913/500000] + train/ActionNoiseL2Loss=0.0643 + throughput/total_tokens=2,287,296,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11914/500000] + train/ActionNoiseL2Loss=0.0825 + throughput/total_tokens=2,287,488,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11915/500000] + train/ActionNoiseL2Loss=0.0718 + throughput/total_tokens=2,287,680,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11916/500000] + train/ActionNoiseL2Loss=0.0418 + throughput/total_tokens=2,287,872,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11917/500000] + train/ActionNoiseL2Loss=0.0279 + throughput/total_tokens=2,288,064,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11918/500000] + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=2,288,256,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11919/500000] + train/ActionNoiseL2Loss=0.0683 + throughput/total_tokens=2,288,448,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11920/500000] + optim/total_grad_norm=0.5774 + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=2,288,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11921/500000] + train/ActionNoiseL2Loss=0.0695 + throughput/total_tokens=2,288,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11922/500000] + train/ActionNoiseL2Loss=0.0545 + throughput/total_tokens=2,289,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11923/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=2,289,216,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11924/500000] + train/ActionNoiseL2Loss=0.0302 + throughput/total_tokens=2,289,408,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11925/500000] + train/ActionNoiseL2Loss=0.0747 + throughput/total_tokens=2,289,600,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11926/500000] + train/ActionNoiseL2Loss=0.0873 + throughput/total_tokens=2,289,792,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11927/500000] + train/ActionNoiseL2Loss=0.0500 + throughput/total_tokens=2,289,984,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11928/500000] + train/ActionNoiseL2Loss=0.0615 + throughput/total_tokens=2,290,176,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11929/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,290,368,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11930/500000] + train/ActionNoiseL2Loss=0.0257 + throughput/total_tokens=2,290,560,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11931/500000] + train/ActionNoiseL2Loss=0.0746 + throughput/total_tokens=2,290,752,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11932/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=2,290,944,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11933/500000] + train/ActionNoiseL2Loss=0.0432 + throughput/total_tokens=2,291,136,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11934/500000] + train/ActionNoiseL2Loss=0.0787 + throughput/total_tokens=2,291,328,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11935/500000] + train/ActionNoiseL2Loss=0.0222 + throughput/total_tokens=2,291,520,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11936/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=2,291,712,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11937/500000] + train/ActionNoiseL2Loss=0.0406 + throughput/total_tokens=2,291,904,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11938/500000] + train/ActionNoiseL2Loss=0.0353 + throughput/total_tokens=2,292,096,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11939/500000] + train/ActionNoiseL2Loss=0.0666 + throughput/total_tokens=2,292,288,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11940/500000] + optim/total_grad_norm=0.6962 + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=2,292,480,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11941/500000] + train/ActionNoiseL2Loss=0.0764 + throughput/total_tokens=2,292,672,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11942/500000] + train/ActionNoiseL2Loss=0.0443 + throughput/total_tokens=2,292,864,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11943/500000] + train/ActionNoiseL2Loss=0.1079 + throughput/total_tokens=2,293,056,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11944/500000] + train/ActionNoiseL2Loss=0.0216 + throughput/total_tokens=2,293,248,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11945/500000] + train/ActionNoiseL2Loss=0.0699 + throughput/total_tokens=2,293,440,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11946/500000] + train/ActionNoiseL2Loss=0.0789 + throughput/total_tokens=2,293,632,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11947/500000] + train/ActionNoiseL2Loss=0.0571 + throughput/total_tokens=2,293,824,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11948/500000] + train/ActionNoiseL2Loss=0.0519 + throughput/total_tokens=2,294,016,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11949/500000] + train/ActionNoiseL2Loss=0.0444 + throughput/total_tokens=2,294,208,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11950/500000] + train/ActionNoiseL2Loss=0.0668 + throughput/total_tokens=2,294,400,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11951/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=2,294,592,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=11952/500000] + train/ActionNoiseL2Loss=0.0459 + throughput/total_tokens=2,294,784,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11953/500000] + train/ActionNoiseL2Loss=0.0471 + throughput/total_tokens=2,294,976,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11954/500000] + train/ActionNoiseL2Loss=0.0308 + throughput/total_tokens=2,295,168,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11955/500000] + train/ActionNoiseL2Loss=0.0939 + throughput/total_tokens=2,295,360,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11956/500000] + train/ActionNoiseL2Loss=0.0538 + throughput/total_tokens=2,295,552,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11957/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,295,744,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11958/500000] + train/ActionNoiseL2Loss=0.0187 + throughput/total_tokens=2,295,936,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11959/500000] + train/ActionNoiseL2Loss=0.0562 + throughput/total_tokens=2,296,128,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11960/500000] + optim/total_grad_norm=0.5270 + train/ActionNoiseL2Loss=0.0410 + throughput/total_tokens=2,296,320,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 + System/Peak GPU Memory (MB)=51,076 +[step=11961/500000] + train/ActionNoiseL2Loss=0.0490 + throughput/total_tokens=2,296,512,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=11962/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,296,704,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11963/500000] + train/ActionNoiseL2Loss=0.0433 + throughput/total_tokens=2,296,896,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11964/500000] + train/ActionNoiseL2Loss=0.0461 + throughput/total_tokens=2,297,088,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11965/500000] + train/ActionNoiseL2Loss=0.0518 + throughput/total_tokens=2,297,280,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11966/500000] + train/ActionNoiseL2Loss=0.0491 + throughput/total_tokens=2,297,472,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11967/500000] + train/ActionNoiseL2Loss=0.0516 + throughput/total_tokens=2,297,664,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11968/500000] + train/ActionNoiseL2Loss=0.0557 + throughput/total_tokens=2,297,856,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11969/500000] + train/ActionNoiseL2Loss=0.0260 + throughput/total_tokens=2,298,048,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=11970/500000] + train/ActionNoiseL2Loss=0.0659 + throughput/total_tokens=2,298,240,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11971/500000] + train/ActionNoiseL2Loss=0.0423 + throughput/total_tokens=2,298,432,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11972/500000] + train/ActionNoiseL2Loss=0.0486 + throughput/total_tokens=2,298,624,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11973/500000] + train/ActionNoiseL2Loss=0.0752 + throughput/total_tokens=2,298,816,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11974/500000] + train/ActionNoiseL2Loss=0.0384 + throughput/total_tokens=2,299,008,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=11975/500000] + train/ActionNoiseL2Loss=0.0605 + throughput/total_tokens=2,299,200,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11976/500000] + train/ActionNoiseL2Loss=0.0550 + throughput/total_tokens=2,299,392,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11977/500000] + train/ActionNoiseL2Loss=0.0245 + throughput/total_tokens=2,299,584,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11978/500000] + train/ActionNoiseL2Loss=0.0440 + throughput/total_tokens=2,299,776,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11979/500000] + train/ActionNoiseL2Loss=0.0966 + throughput/total_tokens=2,299,968,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11980/500000] + optim/total_grad_norm=0.7311 + train/ActionNoiseL2Loss=0.0527 + throughput/total_tokens=2,300,160,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=11981/500000] + train/ActionNoiseL2Loss=0.0707 + throughput/total_tokens=2,300,352,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11982/500000] + train/ActionNoiseL2Loss=0.0517 + throughput/total_tokens=2,300,544,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11983/500000] + train/ActionNoiseL2Loss=0.0413 + throughput/total_tokens=2,300,736,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11984/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=2,300,928,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11985/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=2,301,120,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11986/500000] + train/ActionNoiseL2Loss=0.0542 + throughput/total_tokens=2,301,312,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11987/500000] + train/ActionNoiseL2Loss=0.0399 + throughput/total_tokens=2,301,504,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11988/500000] + train/ActionNoiseL2Loss=0.0619 + throughput/total_tokens=2,301,696,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11989/500000] + train/ActionNoiseL2Loss=0.0842 + throughput/total_tokens=2,301,888,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11990/500000] + train/ActionNoiseL2Loss=0.0402 + throughput/total_tokens=2,302,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=11991/500000] + train/ActionNoiseL2Loss=0.0608 + throughput/total_tokens=2,302,272,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11992/500000] + train/ActionNoiseL2Loss=0.0340 + throughput/total_tokens=2,302,464,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11993/500000] + train/ActionNoiseL2Loss=0.0685 + throughput/total_tokens=2,302,656,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11994/500000] + train/ActionNoiseL2Loss=0.0560 + throughput/total_tokens=2,302,848,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=11995/500000] + train/ActionNoiseL2Loss=0.0448 + throughput/total_tokens=2,303,040,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11996/500000] + train/ActionNoiseL2Loss=0.1253 + throughput/total_tokens=2,303,232,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=11997/500000] + train/ActionNoiseL2Loss=0.0465 + throughput/total_tokens=2,303,424,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11998/500000] + train/ActionNoiseL2Loss=0.0362 + throughput/total_tokens=2,303,616,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=11999/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=2,303,808,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12000/500000] + optim/total_grad_norm=0.7311 + train/ActionNoiseL2Loss=0.0576 + throughput/total_tokens=2,304,000,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +10/14 [16:15:03] INFO | >> Saving config... checkpoint.py:608 +10/14 [16:15:46] INFO | >> Saving model state... checkpoint.py:796 +10/14 [16:16:59] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [16:18:25] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=12001/500000] + train/ActionNoiseL2Loss=0.0512 + throughput/total_tokens=2,304,192,000 + throughput/device/tokens_per_second=1,140 + throughput/device/batches_per_second=0.0475 +[step=12002/500000] + train/ActionNoiseL2Loss=0.0511 + throughput/total_tokens=2,304,384,000 + throughput/device/tokens_per_second=1,137 + throughput/device/batches_per_second=0.0474 +[step=12003/500000] + train/ActionNoiseL2Loss=0.0415 + throughput/total_tokens=2,304,576,000 + throughput/device/tokens_per_second=1,138 + throughput/device/batches_per_second=0.0474 +[step=12004/500000] + train/ActionNoiseL2Loss=0.0396 + throughput/total_tokens=2,304,768,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=12005/500000] + train/ActionNoiseL2Loss=0.0370 + throughput/total_tokens=2,304,960,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=12006/500000] + train/ActionNoiseL2Loss=0.0841 + throughput/total_tokens=2,305,152,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=12007/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=2,305,344,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=12008/500000] + train/ActionNoiseL2Loss=0.0450 + throughput/total_tokens=2,305,536,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=12009/500000] + train/ActionNoiseL2Loss=0.1049 + throughput/total_tokens=2,305,728,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=12010/500000] + train/ActionNoiseL2Loss=0.0470 + throughput/total_tokens=2,305,920,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 + System/Peak GPU Memory (MB)=51,076 +[step=12011/500000] + train/ActionNoiseL2Loss=0.0600 + throughput/total_tokens=2,306,112,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=12012/500000] + train/ActionNoiseL2Loss=0.0625 + throughput/total_tokens=2,306,304,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0478 +[step=12013/500000] + train/ActionNoiseL2Loss=0.0658 + throughput/total_tokens=2,306,496,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=12014/500000] + train/ActionNoiseL2Loss=0.0751 + throughput/total_tokens=2,306,688,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=12015/500000] + train/ActionNoiseL2Loss=0.0650 + throughput/total_tokens=2,306,880,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 +[step=12016/500000] + train/ActionNoiseL2Loss=0.1071 + throughput/total_tokens=2,307,072,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=12017/500000] + train/ActionNoiseL2Loss=0.0582 + throughput/total_tokens=2,307,264,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=12018/500000] + train/ActionNoiseL2Loss=0.0897 + throughput/total_tokens=2,307,456,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=12019/500000] + train/ActionNoiseL2Loss=0.0464 + throughput/total_tokens=2,307,648,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=12020/500000] + optim/total_grad_norm=1.110 + train/ActionNoiseL2Loss=0.0837 + throughput/total_tokens=2,307,840,000 + throughput/device/tokens_per_second=1,148 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=12021/500000] + train/ActionNoiseL2Loss=0.0558 + throughput/total_tokens=2,308,032,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=12022/500000] + train/ActionNoiseL2Loss=0.0405 + throughput/total_tokens=2,308,224,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=12023/500000] + train/ActionNoiseL2Loss=0.0955 + throughput/total_tokens=2,308,416,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=12024/500000] + train/ActionNoiseL2Loss=0.0671 + throughput/total_tokens=2,308,608,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=12025/500000] + train/ActionNoiseL2Loss=0.0203 + throughput/total_tokens=2,308,800,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12026/500000] + train/ActionNoiseL2Loss=0.0457 + throughput/total_tokens=2,308,992,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12027/500000] + train/ActionNoiseL2Loss=0.0663 + throughput/total_tokens=2,309,184,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12028/500000] + train/ActionNoiseL2Loss=0.0426 + throughput/total_tokens=2,309,376,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12029/500000] + train/ActionNoiseL2Loss=0.0565 + throughput/total_tokens=2,309,568,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=12030/500000] + train/ActionNoiseL2Loss=0.0621 + throughput/total_tokens=2,309,760,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=12031/500000] + train/ActionNoiseL2Loss=0.0730 + throughput/total_tokens=2,309,952,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12032/500000] + train/ActionNoiseL2Loss=0.0522 + throughput/total_tokens=2,310,144,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12033/500000] + train/ActionNoiseL2Loss=0.1143 + throughput/total_tokens=2,310,336,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12034/500000] + train/ActionNoiseL2Loss=0.0609 + throughput/total_tokens=2,310,528,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=12035/500000] + train/ActionNoiseL2Loss=0.0590 + throughput/total_tokens=2,310,720,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12036/500000] + train/ActionNoiseL2Loss=0.0360 + throughput/total_tokens=2,310,912,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12037/500000] + train/ActionNoiseL2Loss=0.0601 + throughput/total_tokens=2,311,104,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12038/500000] + train/ActionNoiseL2Loss=0.0629 + throughput/total_tokens=2,311,296,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12039/500000] + train/ActionNoiseL2Loss=0.0501 + throughput/total_tokens=2,311,488,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=12040/500000] + optim/total_grad_norm=0.8040 + train/ActionNoiseL2Loss=0.0481 + throughput/total_tokens=2,311,680,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 + System/Peak GPU Memory (MB)=51,076 +[step=12041/500000] + train/ActionNoiseL2Loss=0.0617 + throughput/total_tokens=2,311,872,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=12042/500000] + train/ActionNoiseL2Loss=0.0709 + throughput/total_tokens=2,312,064,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=12043/500000] + train/ActionNoiseL2Loss=0.0675 + throughput/total_tokens=2,312,256,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=12044/500000] + train/ActionNoiseL2Loss=0.0419 + throughput/total_tokens=2,312,448,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=12045/500000] + train/ActionNoiseL2Loss=0.0409 + throughput/total_tokens=2,312,640,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=12046/500000] + train/ActionNoiseL2Loss=0.0523 + throughput/total_tokens=2,312,832,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=12047/500000] + train/ActionNoiseL2Loss=0.0563 + throughput/total_tokens=2,313,024,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0480 +[step=12048/500000] + train/ActionNoiseL2Loss=0.0540 + throughput/total_tokens=2,313,216,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=12049/500000] + train/ActionNoiseL2Loss=0.0568 + throughput/total_tokens=2,313,408,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=12050/500000] + train/ActionNoiseL2Loss=0.0587 + throughput/total_tokens=2,313,600,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=51,076 +[step=12051/500000] + train/ActionNoiseL2Loss=0.0355 + throughput/total_tokens=2,313,792,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=12052/500000] + train/ActionNoiseL2Loss=0.0224 + throughput/total_tokens=2,313,984,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 +[step=12053/500000] + train/ActionNoiseL2Loss=0.0593 + throughput/total_tokens=2,314,176,000 + throughput/device/tokens_per_second=1,146 + throughput/device/batches_per_second=0.0478 diff --git a/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/files/requirements.txt b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/files/requirements.txt new file mode 100644 index 0000000000000000000000000000000000000000..5a5e971a5d9f3b6f6a75248e203682c5fbcd69e8 --- /dev/null +++ b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/files/requirements.txt @@ -0,0 +1,286 @@ +ai2-molmo==0.0.0 +astunparse==1.6.3 +flatbuffers==25.2.10 +gast==0.6.0 +google-pasta==0.2.0 +h5py==3.14.0 +libclang==18.1.1 +Markdown==3.9 +namex==0.1.0 +opt_einsum==3.4.0 +optree==0.17.0 +tensorboard-data-server==0.7.2 +tensorflow-io-gcs-filesystem==0.37.1 +termcolor==3.1.0 +Werkzeug==3.1.3 +Brotli==1.1.0 +Farama-Notifications==0.0.4 +MarkupSafe==2.1.5 +PyYAML==6.0.2 +absl-py==2.3.1 +accelerate==1.10.1 +ai2-molmo==0.0.0 +aiofiles==24.1.0 +aiohappyeyeballs==2.6.1 +aiohttp==3.12.15 +aiosignal==1.4.0 +annotated-types==0.7.0 +antlr4-python3-runtime==4.9.3 +anyio==4.10.0 +array_record==0.8.1 +async-timeout==5.0.1 +attrs==25.3.0 +av==15.1.0 +backports.tarfile==1.2.0 +beaker-gantry==3.2.0 +beaker-py==2.5.0 +black==23.12.1 +blinker==1.9.0 +boltons==25.0.0 +boto3==1.40.33 +botocore==1.40.33 +build==1.3.0 +cached_path==1.7.3 +cached-property==2.0.1 +cachetools==5.5.2 +certifi==2025.8.3 +cffi==2.0.0 +charset-normalizer==3.4.3 +click==8.2.1 +click-help-colors==0.9.4 +click-option-group==0.5.7 +cloudpickle==3.1.1 +cmake==4.1.0 +contourpy==1.3.2 +cryptography==46.0.1 +cycler==0.12.1 +dataclass-extensions==0.2.3 +datasets==3.6.0 +decorator==5.2.1 +deepdiff==8.6.1 +diffusers==0.35.1 +dill==0.3.8 +distro==1.9.0 +dlimp==0.0.1 +dm-tree==0.1.9 +docutils==0.22.1 +draccus==0.10.0 +editdistance==0.8.1 +einops==0.8.1 +einops-exts==0.0.4 +et_xmlfile==2.0.0 +etils==1.13.0 +evdev==1.9.2 +exceptiongroup==1.3.0 +face==24.0.0 +fastapi==0.116.2 +ffmpy==0.6.1 +fiddle==0.3.0 +filelock==3.13.1 +Flask==3.1.2 +fonttools==4.60.0 +frozenlist==1.7.0 +fsspec==2023.9.2 +ftfy==6.3.1 +gcsfs==2023.9.2 +gitdb==4.0.12 +GitPython==3.1.45 +glom==24.11.0 +google-api-core==2.25.1 +google-auth==2.40.3 +google-auth-oauthlib==1.2.2 +google-cloud-core==2.4.3 +google-cloud-storage==2.19.0 +google-crc32c==1.7.1 +google-resumable-media==2.7.2 +googleapis-common-protos==1.70.0 +gradio==5.46.0 +gradio_client==1.13.0 +graphviz==0.21 +groovy==0.1.2 +grpcio==1.75.0 +gymnasium==0.29.1 +h11==0.16.0 +hf_transfer==0.1.9 +hf-xet==1.1.10 +httpcore==1.0.9 +httpx==0.28.1 +huggingface-hub==0.35.0 +id==1.5.0 +idna==3.10 +imageio==2.37.0 +imageio-ffmpeg==0.6.0 +importlib_metadata==8.7.0 +importlib_resources==6.5.2 +iniconfig==2.1.0 +inquirerpy==0.3.4 +isort==5.12.0 +itsdangerous==2.2.0 +jaraco.classes==3.4.0 +jaraco.context==6.0.1 +jaraco.functools==4.3.0 +jeepney==0.9.0 +Jinja2==3.1.4 +jiter==0.11.0 +jmespath==1.0.1 +joblib==1.5.2 +jsonlines==4.0.0 +keras==2.15.0 +keyring==25.6.0 +kiwisolver==1.4.9 +latex2sympy2_extended==1.10.2 +lerobot==0.3.4 +Levenshtein==0.27.1 +libcst==1.8.4 +lightning-utilities==0.15.2 +markdown-it-py==4.0.0 +math-verify==0.8.0 +matplotlib==3.10.6 +mdurl==0.1.2 +mergedeep==1.3.4 +ml-dtypes==0.2.0 +ml_dtypes==0.5.3 +more-itertools==10.8.0 +mpmath==1.3.0 +msgspec==0.19.0 +multidict==6.6.4 +multiprocess==0.70.16 +mypy==1.3.0 +mypy_extensions==1.1.0 +necessary==0.4.3 +networkx==3.3 +nh3==0.3.0 +nltk==3.9.1 +numpy==1.26.4 +oauthlib==3.3.1 +omegaconf==2.3.0 +openai==1.108.0 +opencv-python-headless==4.12.0.88 +OpenEXR==3.4.0 +openpyxl==3.1.5 +orderly-set==5.5.0 +orjson==3.11.3 +packaging==25.0 +pandas==2.3.2 +pathspec==0.12.1 +petname==2.6 +pfzy==0.3.4 +pillow==11.0.0 +pip==25.2 +platformdirs==4.4.0 +pluggy==1.6.0 +promise==2.3 +prompt_toolkit==3.0.52 +propcache==0.3.2 +proto-plus==1.26.1 +protobuf==4.21.12 +protobuf==6.32.1 +psutil==7.1.0 +pyarrow==21.0.0 +pyasn1==0.6.1 +pyasn1_modules==0.4.2 +pycparser==2.23 +pydantic==2.11.9 +pydantic_core==2.33.2 +pydub==0.25.1 +Pygments==2.19.2 +pynput==1.8.1 +pyparsing==3.2.4 +pyproject_hooks==1.2.0 +pyserial==3.5 +pytest==8.4.2 +pytest-sphinx==0.6.3 +python-dateutil==2.9.0.post0 +python-Levenshtein==0.27.1 +python-multipart==0.0.20 +python-xlib==0.33 +pytorch-triton-rocm==3.4.0 +pytz==2025.2 +pyyaml-include==1.4.1 +RapidFuzz==3.14.1 +readme_renderer==44.0 +regex==2025.9.1 +requests==2.32.5 +requests-oauthlib==2.0.0 +requests-toolbelt==1.0.0 +requirements-parser==0.13.0 +rerun-sdk==0.22.1 +rfc3986==2.0.0 +rich==13.9.4 +rsa==4.9.1 +ruff==0.13.0 +s3transfer==0.14.0 +safehttpx==0.1.6 +safetensors==0.6.2 +scikit-learn==1.7.2 +scipy==1.15.3 +SecretStorage==3.4.0 +semantic-version==2.10.0 +sentencepiece==0.2.1 +sentry-sdk==2.38.0 +setuptools==78.1.1 +shellingham==1.5.4 +six==1.17.0 +smart_open==7.3.1 +smashed==0.21.5 +smmap==5.0.2 +sniffio==1.3.1 +starlette==0.48.0 +sympy==1.13.3 +tensorboard==2.15.2 +tensorboard==2.19.0 +tensorflow==2.15.0 +tensorflow-addons==0.23.0 +tensorflow-datasets==4.9.3 +tensorflow-estimator==2.15.0 +tensorflow-graphics==2021.12.3 +tensorflow-metadata==1.17.2 +threadpoolctl==3.6.0 +timm==1.0.19 +tokenizers==0.22.0 +toml==0.10.2 +tomli==2.2.1 +tomlkit==0.13.3 +torch==2.8.0+rocm6.4 +torchcodec==0.5 +torchmetrics==1.8.2 +torchvision==0.23.0+rocm6.4 +tqdm==4.67.1 +transformers==4.56.1 +trimesh==4.8.2 +trouting==0.3.3 +twine==6.2.0 +typeguard==2.13.3 +typer==0.17.4 +typing_extensions==4.15.0 +typing-inspect==0.9.0 +typing-inspection==0.4.1 +tzdata==2025.2 +urllib3==2.5.0 +uvicorn==0.35.0 +wandb==0.21.4 +wcwidth==0.2.13 +websockets==15.0.1 +wheel==0.45.1 +wrapt==1.14.2 +xxhash==3.5.0 +yarl==1.20.1 +zipp==3.23.0 +lerobot==0.3.4 +minLoRA==0.1.0 +autocommand==2.2.2 +backports.tarfile==1.2.0 +importlib_metadata==8.0.0 +inflect==7.3.1 +jaraco.collections==5.1.0 +jaraco.context==5.3.0 +jaraco.functools==4.0.1 +jaraco.text==3.12.1 +more-itertools==10.3.0 +packaging==24.2 +platformdirs==4.2.2 +tomli==2.0.1 +typeguard==4.3.0 +typing_extensions==4.12.2 +wheel==0.45.1 +zipp==3.19.2 diff --git a/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/files/wandb-metadata.json b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/files/wandb-metadata.json new file mode 100644 index 0000000000000000000000000000000000000000..2278b193e1c0c898d53b7cab833683683ba21e52 --- /dev/null +++ b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/files/wandb-metadata.json @@ -0,0 +1,204 @@ +{ + "os": "Linux-5.15.0-140-generic-x86_64-with-glibc2.35", + "python": "CPython 3.10.18", + "startedAt": "2025-10-11T16:38:32.322236Z", + "args": [ + "qwen2_7b", + "save_folder=/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/eraser_flow_matching", + "--vision_backbone", + "openai", + "--action_head", + "flow_matching", + "--seq_len", + "1600", + "--ft_llm", + "--checkpoint", + "/vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924", + "--device_train_microbatch_size", + "16", + "--global_batch_size", + "126", + "--dataset", + "vla_dataset_realworld", + "--llm_learning_rate", + "5e-5", + "--wandb_entity", + "henryeap", + "--wandb_project", + "a1-realworld", + "--wandb_run_name", + "eraser", + "--real_world_vla_config_path", + "vla_config_realworld/vla_config_eraser.yaml", + "--save_overwrite" + ], + "program": "/vast/users/xiaodan/zhangjian/A1/launch_scripts/train_vla.py", + "codePath": "launch_scripts/train_vla.py", + "codePathLocal": "launch_scripts/train_vla.py", + "git": { + "remote": "https://github.com/Spatialtemporal-AI/A1.git", + "commit": "7c171df5d31577ede69d05172c2bc62d42ef3e3d" + }, + "email": "ihenrykwok@outlook.com", + "root": "/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/ckpt/eraser_flow_matching/wandb", + "host": "auh7-1b-gpu-257", + "executable": "/vast/users/xiaodan/miniconda3/envs/a1/bin/python3.10", + "cpu_count": 64, + "cpu_count_logical": 128, + "gpu": "Instinct MI210", + "gpu_count": 8, + "disk": { + "/": { + "total": "470343073792", + "used": "50676125696" + } + }, + "memory": { + "total": "2434606948352" + }, + "gpu_amd": [ + { + "id": "2", + "uniqueId": "0xf4493c96c09744d2", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "0", + "uniqueId": "0xb58c29a4c3c6588f", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "5", + "uniqueId": "0xb4e5eead729ba9d9", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "4", + "uniqueId": "0xeaac05cb926cff2", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "6", + "uniqueId": "0x4e7b2e0611069bd3", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "1", + "uniqueId": "0x755e5351c843dd85", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "7", + "uniqueId": "0x44a666bd7780e4c9", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + }, + { + "id": "3", + "uniqueId": "0xfa9e3533bde0bfe9", + "vbiosVersion": "113-D67301V-073", + "performanceLevel": "auto", + "maxPower": "300.0", + "series": "Instinct MI210", + "model": "0x740f", + "vendor": "Advanced Micro Devices, Inc. [AMD/ATI]", + "sku": "D67301V", + "sclkRange": "500Mhz - 1700Mhz", + "mclkRange": "400Mhz - 1600Mhz" + } + ], + "slurm": { + "cluster_name": "ai-04r", + "conf": "/etc/slurm/slurm.conf", + "cpus_on_node": "128", + "gpus_on_node": "8", + "gtids": "0", + "job_account": "faculty-acc", + "job_cpus_per_node": "128", + "job_end_time": "1760459846", + "job_gid": "2000", + "job_gpus": "0,1,2,3,4,5,6,7", + "job_id": "2285", + "job_name": "mh_eraser_flow_matching", + "job_nodelist": "auh7-1b-gpu-257", + "job_num_nodes": "1", + "job_partition": "faculty", + "job_qos": "xdqos", + "job_start_time": "1760200646", + "job_uid": "2013", + "job_user": "xiaodan", + "jobid": "2285", + "localid": "0", + "nnodes": "1", + "nodeid": "0", + "nodelist": "auh7-1b-gpu-257", + "nprocs": "1", + "ntasks": "1", + "ntasks_per_node": "1", + "oom_kill_step": "0", + "prio_process": "0", + "procid": "0", + "submit_dir": "/vast/users/xiaodan/zhangjian/A1/launch_scripts", + "submit_host": "auh-1b-cpu-login-001", + "task_pid": "1750364", + "tasks_per_node": "1", + "topology_addr": "auh7-1b-gpu-257", + "topology_addr_pattern": "node" + }, + "writerId": "sxmo78yvkkswxzfrthx903hv3at8k5qs" +} \ No newline at end of file diff --git a/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/logs/debug-core.log b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/logs/debug-core.log new file mode 100644 index 0000000000000000000000000000000000000000..06fb9c280a2cdb22c2a96028d860cba17b2ca1a9 --- /dev/null +++ b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/logs/debug-core.log @@ -0,0 +1,6 @@ +{"time":"2025-10-11T16:38:32.482685689Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmph9e5w27q/port-1750558.txt","pid":1750558,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false} +{"time":"2025-10-11T16:38:32.483185518Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":1750558} +{"time":"2025-10-11T16:38:32.483127687Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-1750558-1750735-1843609952/socket","Net":"unix"}} +{"time":"2025-10-11T16:38:32.571104464Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"} +{"time":"2025-10-11T16:38:32.584015164Z","level":"INFO","msg":"handleInformInit: received","streamId":"yqnt28c8","id":"1(@)"} +{"time":"2025-10-11T16:38:33.732937724Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"yqnt28c8","id":"1(@)"} diff --git a/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/logs/debug-internal.log b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/logs/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..eb290784ac6ab6aaf91849ad696f7d4596c50668 --- /dev/null +++ b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/logs/debug-internal.log @@ -0,0 +1,8 @@ +{"time":"2025-10-11T16:38:32.587302182Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-11T16:38:33.732885593Z","level":"INFO","msg":"stream: created new stream","id":"yqnt28c8"} +{"time":"2025-10-11T16:38:33.732932354Z","level":"INFO","msg":"stream: started","id":"yqnt28c8"} +{"time":"2025-10-11T16:38:33.732959824Z","level":"INFO","msg":"writer: started","stream_id":"yqnt28c8"} +{"time":"2025-10-11T16:38:33.732985135Z","level":"INFO","msg":"handler: started","stream_id":"yqnt28c8"} +{"time":"2025-10-11T16:38:33.732961384Z","level":"INFO","msg":"sender: started","stream_id":"yqnt28c8"} +{"time":"2025-10-13T08:15:22.219814038Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-13T20:01:35.03758236Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded"} diff --git a/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/logs/debug.log b/eraser_flow_matching/wandb/wandb/run-20251011_163832-yqnt28c8/logs/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/eraser_l1_regression/step11500-action-head/metadata.pt b/eraser_l1_regression/step11500-action-head/metadata.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcf35cc50d811be8391b077330fc58f140a6565a --- /dev/null +++ b/eraser_l1_regression/step11500-action-head/metadata.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f3468869fca8c228cf940661de292bc786f2b18fa96d39a892606183f8dd9c0 +size 1331 diff --git a/eraser_l1_regression/step12000-action-head/metadata.pt b/eraser_l1_regression/step12000-action-head/metadata.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd2f224af58612b62d81033fb0bfb23b0ab41a53 --- /dev/null +++ b/eraser_l1_regression/step12000-action-head/metadata.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620f952d81c645b6e811733acfcda83cb57d683353c484746edb322f5094c21e +size 1331 diff --git a/eraser_l1_regression/step12000-unsharded/train.pt b/eraser_l1_regression/step12000-unsharded/train.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca237da6c1bf73d685cde208eb4a25bcd504e7b7 --- /dev/null +++ b/eraser_l1_regression/step12000-unsharded/train.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02ede2a3914fb17fda60a58b2ed5b3b8ea62b93ffa5f482bdd9f5e2b83a5cde +size 15061 diff --git a/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/files/output.log b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/files/output.log new file mode 100644 index 0000000000000000000000000000000000000000..0eaaf4b7425bbb98fd41df64b704e1e97e8875b0 --- /dev/null +++ b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/files/output.log @@ -0,0 +1,64022 @@ +wandb: Detected [openai] in use. +wandb: Use W&B Weave for improved LLM call tracing. Install Weave with `pip install weave` then add `import weave` to the top of your script. +wandb: For more information, check out the docs at: https://weave-docs.wandb.ai/ +10/11 [16:38:47] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +****** vla_cfg: {'datasets': {'rlds': {'name': None, 'path': None, 'weight': 1.0, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [['/vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Eraser', 8, 'bounds']], 'open-source-real-world': {'rlds': {'name': 'a1_real_world', 'path': '/vast/users/xiaodan/zhangjian/datasets/OXE', 'weight': 8, 'action_proprio_normalization_type': 'bounds_q99', 'image_augmentation': False}, 'lerobot': [], 'agibot': {'path': None, 'weight': 8, 'action_proprio_normalization_type': None}}}, 'model': {'action_head': {'action_dim': 16, 'proprio_dim': 16, 'num_actions_chunk': 8, 'action_tokens_mapping': {'left_end_effector': 8, 'right_end_effector': 8}, 'use_left_eef': True, 'use_mobile_base': False}}} +****** Skip RLDS main; path not found: None +****** start build LeRobot main... +build_tokenizer, cache_dir None tokenizer_dir None +10/11 [16:38:49] INFO | >> Padding tokenizer with 418 tokens tokenizer.py:130 + INFO | >> Loading train dataset: vla_dataset_realworld/train __init__.py:438 +****** before LeRobot dataset... +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/workspace/minghao.guo/warehouse_a1/dataset/realworld/Lerobot_Eraser +camera_keys: ['image', 'hand_left_image', 'hand_right_image'], state_key: state, action_key: actions +****** length of the dataset: 13441 +10/11 [16:38:51] INFO | >> build_rlds_train_dataset: Loading train dataset: vla_dataset_realworld/train __init__.py:521 +****** Import RLDSBatchTransform, RLDSDataset successfully. +****** before RLDS dataset... +****** data_config.rlds_dataset_name: a1_real_world +****** data_config.rlds_data_root_dir: /vast/users/xiaodan/zhangjian/datasets/OXE +214************** +10/11 [16:38:52] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/fractal20220817_data/0.1.0/dataset_statistics_138513de447c9e5435c5a12cc1c4a3c6a6434524fbd28f4 + 5463261fac12cf3fb.json. +214************** +10/11 [16:38:53] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/jaco_play/0.1.0/dataset_statistics_e081d4716a3da95df91c79d661ae59fa26a43da49db4bf8d716b622b56 + 3b0ea3.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_cable_routing/0.1.0/dataset_statistics_08cb4c5b7c5e6c035fc84ea85b2d54c0c46ad608a8763 + 4ebb18374088d23cd76.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/viola/0.1.0/dataset_statistics_2415d8f7de73c8761fedd7c2a9590667fb0d3fdd26664bf4c100222e5cdb89 + b9.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_autolab_ur5/0.1.0/dataset_statistics_1b798b015e7b2c4e4396719e3aa4d43a2f400b2edf5dbb0 + 820cb3df6943d8ddc.json. +214************** +10/11 [16:38:54] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_buds_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_ccecde24cc01793b221 + 4eb0c4c5d7cc0e3ccc623db99bd892b83552b20decfb7.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/nyu_franka_play_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_b0d79557eac3059 + ebf9f679a8f044bd60403f0cba16a37e0df2fe1654416ffe7.json. +214************** +10/11 [16:38:55] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/furniture_bench_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_76735bab3752978 + bef83e1341d3c8db0a0d5a10397247eb3e0459388dccfe698.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_sailor_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_4127c515a9413766f + e40ac696d884550bc655a40952ef3ae457c404d31570123.json. +214************** +10/11 [16:38:56] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/austin_sirius_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_cb2e0273f80029a19 + dc3dbb3a3a4118a5598e7bff3ff0245891255825b04b42a.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/dlr_edan_shared_control_converted_externally_to_rlds/0.1.0/dataset_statistics_b8984563fc3e7ea + c0803c667ef58c9deaf2e747683568306ea1d83505d532a76.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/utaustin_mutex/0.1.0/dataset_statistics_0a99ee5a8ce4a34ba018a7c0c742a1b74ab7abb7d7a3925f8596a + 3fc4eb8efc7.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/berkeley_fanuc_manipulation/0.1.0/dataset_statistics_a98d349d0364668095ea3ca38c6785e94f35e5e5 + 8e234c88fac83775a923b0d0.json. +214************** +10/11 [16:38:57] INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/bc_z/0.1.0/dataset_statistics_8187209d5cb273687cc8666697219dae50914ae2bee7f03552bd85a91fcfe7a + 4.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/roboturk/0.1.0/dataset_statistics_3aa821e17a2937f941d4102cfadcb1154853cb45dcec07ccc66893b01f6 + f1b40.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/toto/0.1.0/dataset_statistics_505a51eb76e85fe0969e8e70e45fb8c9ae5d3b1fae2851c7899bea91f74b979 + 0.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/ucsd_kitchen_dataset_converted_externally_to_rlds/0.1.0/dataset_statistics_1f1a5f310a2d5a6edc + 0e217370e135c8c8598290f11f57025037adcb0d033926.json. +214************** + INFO | >> [*] Loading existing dataset statistics from data_utils.py:200 + /vast/users/xiaodan/zhangjian/datasets/OXE/iamlab_cmu_pickup_insert_converted_externally_to_rlds/0.1.0/dataset_statistics_698a1f892f8866 + af9cb4bd5a23611fa44d8c7d9d816f9b3049d2fc3b62442079.json. + +###################################################################################### +# Loading the following 18 datasets (incl. sampling weight): # +# fractal20220817_data: ====================================================0.529250 # +# jaco_play: ===============================================================0.010898 # +# berkeley_cable_routing: ==================================================0.005916 # +# viola: ===================================================================0.021337 # +# berkeley_autolab_ur5: ====================================================0.027379 # +# austin_buds_dataset_converted_externally_to_rlds: ========================0.004768 # +# nyu_franka_play_dataset_converted_externally_to_rlds: ====================0.018817 # +# furniture_bench_dataset_converted_externally_to_rlds: ====================0.055185 # +# austin_sailor_dataset_converted_externally_to_rlds: ======================0.049354 # +# austin_sirius_dataset_converted_externally_to_rlds: ======================0.039129 # +# dlr_edan_shared_control_converted_externally_to_rlds: ====================0.001248 # +# utaustin_mutex: ==========================================================0.050583 # +# berkeley_fanuc_manipulation: =============================================0.017504 # +# bc_z: ====================================================================0.168166 # +# roboturk: ================================================================0.000131 # +# toto: ====================================================================0.000228 # +# ucsd_kitchen_dataset_converted_externally_to_rlds: =======================0.000006 # +# iamlab_cmu_pickup_insert_converted_externally_to_rlds: ===================0.000102 # +###################################################################################### + +10/11 [16:38:58] INFO | >> [*] Threads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:563 + INFO | >> [*] Reads per Dataset: [14 1 1 1 1 1 1 2 1 1 1 1 1 5 1 1 1 1] dataset.py:564 + INFO | >> [*] Constructing datasets... dataset.py:567 +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +214************** +10/11 [16:39:03] INFO | >> [*] Applying frame transforms on dataset... dataset.py:607 +****** after RLDSDataset initialization! +****** length of the dataset: 7154275 +****** Build rlds train dataset: IterableDatasetWrapper successfully. +****** path: None +****** Skip AgiBotWorld-Alpha open-source-real-world; path not found: None +****** After build vla train dataset... +****** iterable_sources: [, ] +****** Before build mixed iterable dataset... +****** Build vla train dataloader successfully! +************************* Build train_dataloader successful! +************************* Before build_inf_evaluators + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:4807: UserWarning: No warnings.py:109 + device id is provided via `init_process_group` or `barrier `. Using the current device set by the user. + warnings.warn( # warn only once + +************************* Build evaluators successful! +************************* Early exit flags: early_exit=False +PROPRIO_DIM 16 does not match ACTION_DIM 16 for AffordVLA +************************* Initialize model successful! +***** state_dict_path: /vast/users/xiaodan/zhangjian/molmo_data/Molmo-7B-D-0924/model.pt +***** Load checkpoint successful! +missing keys: ['action_head.model.layer_norm1.weight', 'action_head.model.layer_norm1.bias', 'action_head.model.fc1.weight', 'action_head.model.fc1.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.0.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.0.ffn.1.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.0.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.0.bias', 'action_head.model.mlp_resnet_blocks.1.ffn.1.weight', 'action_head.model.mlp_resnet_blocks.1.ffn.1.bias', 'action_head.model.layer_norm2.weight', 'action_head.model.layer_norm2.bias', 'action_head.model.fc2.weight', 'action_head.model.fc2.bias', 'proprio_projector.fc1.weight', 'proprio_projector.fc1.bias', 'proprio_projector.fc2.weight', 'proprio_projector.fc2.bias'] +unexpected keys: [] +************************* Initialize model successful! +************************* Before FSDP model wrapping +************************* FSDP model wrapping successful! +************************* Before building optimizer and scheduler +10/11 [16:40:36] INFO | >> Constructing optimizer with 2 param groups optim.py:1283 +************************************************** +After building optimizer and scheduler and model, before training, peak GPU memory (MB): 35614 +************************* VLATrainer initialized successfully! +************************* Before trainer.fit() +Pre-train system metrics + System/Peak GPU Memory (MB)=35,614 +[step=1/500000] + train/ActionL1Loss=0.5824 + throughput/total_tokens=192,000 + System/Peak GPU Memory (MB)=40,153 +[step=2/500000] + train/ActionL1Loss=0.5473 + throughput/total_tokens=384,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 + System/Peak GPU Memory (MB)=46,924 +[step=3/500000] + train/ActionL1Loss=0.6003 + throughput/total_tokens=576,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=4/500000] + train/ActionL1Loss=0.5933 + throughput/total_tokens=768,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=5/500000] + train/ActionL1Loss=0.5078 + throughput/total_tokens=960,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=6/500000] + train/ActionL1Loss=0.5089 + throughput/total_tokens=1,152,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=7/500000] + train/ActionL1Loss=0.4652 + throughput/total_tokens=1,344,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=8/500000] + train/ActionL1Loss=0.4365 + throughput/total_tokens=1,536,000 + throughput/device/tokens_per_second=1,165 + throughput/device/batches_per_second=0.0486 +[step=9/500000] + train/ActionL1Loss=0.4633 + throughput/total_tokens=1,728,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=10/500000] + train/ActionL1Loss=0.3726 + throughput/total_tokens=1,920,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 + System/Peak GPU Memory (MB)=46,924 +[step=11/500000] + train/ActionL1Loss=0.3470 + throughput/total_tokens=2,112,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 +[step=12/500000] + train/ActionL1Loss=0.3971 + throughput/total_tokens=2,304,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=13/500000] + train/ActionL1Loss=0.3305 + throughput/total_tokens=2,496,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0487 +[step=14/500000] + train/ActionL1Loss=0.3225 + throughput/total_tokens=2,688,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=15/500000] + train/ActionL1Loss=0.3732 + throughput/total_tokens=2,880,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=16/500000] + train/ActionL1Loss=0.2990 + throughput/total_tokens=3,072,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=17/500000] + train/ActionL1Loss=0.3297 + throughput/total_tokens=3,264,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=18/500000] + train/ActionL1Loss=0.3077 + throughput/total_tokens=3,456,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=19/500000] + train/ActionL1Loss=0.3155 + throughput/total_tokens=3,648,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=20/500000] + optim/total_grad_norm=14.58 + train/ActionL1Loss=0.3113 + throughput/total_tokens=3,840,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 + System/Peak GPU Memory (MB)=46,924 +[step=21/500000] + train/ActionL1Loss=0.3053 + throughput/total_tokens=4,032,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=22/500000] + train/ActionL1Loss=0.4309 + throughput/total_tokens=4,224,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=23/500000] + train/ActionL1Loss=0.3468 + throughput/total_tokens=4,416,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=24/500000] + train/ActionL1Loss=0.2505 + throughput/total_tokens=4,608,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=25/500000] + train/ActionL1Loss=0.3106 + throughput/total_tokens=4,800,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=26/500000] + train/ActionL1Loss=0.2877 + throughput/total_tokens=4,992,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=27/500000] + train/ActionL1Loss=0.2973 + throughput/total_tokens=5,184,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=28/500000] + train/ActionL1Loss=0.2676 + throughput/total_tokens=5,376,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=29/500000] + train/ActionL1Loss=0.2826 + throughput/total_tokens=5,568,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=30/500000] + train/ActionL1Loss=0.3036 + throughput/total_tokens=5,760,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=31/500000] + train/ActionL1Loss=0.2350 + throughput/total_tokens=5,952,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=32/500000] + train/ActionL1Loss=0.2683 + throughput/total_tokens=6,144,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=33/500000] + train/ActionL1Loss=0.2923 + throughput/total_tokens=6,336,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=34/500000] + train/ActionL1Loss=0.3006 + throughput/total_tokens=6,528,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=35/500000] + train/ActionL1Loss=0.2875 + throughput/total_tokens=6,720,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=36/500000] + train/ActionL1Loss=0.2558 + throughput/total_tokens=6,912,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=37/500000] + train/ActionL1Loss=0.2568 + throughput/total_tokens=7,104,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=38/500000] + train/ActionL1Loss=0.2753 + throughput/total_tokens=7,296,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=39/500000] + train/ActionL1Loss=0.3441 + throughput/total_tokens=7,488,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=40/500000] + optim/total_grad_norm=18.95 + train/ActionL1Loss=0.2511 + throughput/total_tokens=7,680,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=41/500000] + train/ActionL1Loss=0.2689 + throughput/total_tokens=7,872,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=42/500000] + train/ActionL1Loss=0.2639 + throughput/total_tokens=8,064,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=43/500000] + train/ActionL1Loss=0.2563 + throughput/total_tokens=8,256,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=44/500000] + train/ActionL1Loss=0.2877 + throughput/total_tokens=8,448,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=45/500000] + train/ActionL1Loss=0.2616 + throughput/total_tokens=8,640,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=46/500000] + train/ActionL1Loss=0.2846 + throughput/total_tokens=8,832,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=47/500000] + train/ActionL1Loss=0.3060 + throughput/total_tokens=9,024,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=48/500000] + train/ActionL1Loss=0.2967 + throughput/total_tokens=9,216,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=49/500000] + train/ActionL1Loss=0.2511 + throughput/total_tokens=9,408,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=50/500000] + train/ActionL1Loss=0.2587 + throughput/total_tokens=9,600,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=51/500000] + train/ActionL1Loss=0.2510 + throughput/total_tokens=9,792,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=52/500000] + train/ActionL1Loss=0.2628 + throughput/total_tokens=9,984,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=53/500000] + train/ActionL1Loss=0.2522 + throughput/total_tokens=10,176,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=54/500000] + train/ActionL1Loss=0.2359 + throughput/total_tokens=10,368,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=55/500000] + train/ActionL1Loss=0.2914 + throughput/total_tokens=10,560,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0487 +[step=56/500000] + train/ActionL1Loss=0.2837 + throughput/total_tokens=10,752,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 +[step=57/500000] + train/ActionL1Loss=0.2476 + throughput/total_tokens=10,944,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 +[step=58/500000] + train/ActionL1Loss=0.2326 + throughput/total_tokens=11,136,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=59/500000] + train/ActionL1Loss=0.2587 + throughput/total_tokens=11,328,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=60/500000] + optim/total_grad_norm=13.71 + train/ActionL1Loss=0.2739 + throughput/total_tokens=11,520,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 + System/Peak GPU Memory (MB)=46,924 +[step=61/500000] + train/ActionL1Loss=0.2727 + throughput/total_tokens=11,712,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0487 +[step=62/500000] + train/ActionL1Loss=0.2891 + throughput/total_tokens=11,904,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 +[step=63/500000] + train/ActionL1Loss=0.2565 + throughput/total_tokens=12,096,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0487 +[step=64/500000] + train/ActionL1Loss=0.3131 + throughput/total_tokens=12,288,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 +[step=65/500000] + train/ActionL1Loss=0.2744 + throughput/total_tokens=12,480,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=66/500000] + train/ActionL1Loss=0.2431 + throughput/total_tokens=12,672,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 +[step=67/500000] + train/ActionL1Loss=0.2131 + throughput/total_tokens=12,864,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0487 +[step=68/500000] + train/ActionL1Loss=0.2364 + throughput/total_tokens=13,056,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=69/500000] + train/ActionL1Loss=0.2208 + throughput/total_tokens=13,248,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=70/500000] + train/ActionL1Loss=0.1769 + throughput/total_tokens=13,440,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=71/500000] + train/ActionL1Loss=0.2248 + throughput/total_tokens=13,632,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=72/500000] + train/ActionL1Loss=0.2469 + throughput/total_tokens=13,824,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=73/500000] + train/ActionL1Loss=0.2897 + throughput/total_tokens=14,016,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=74/500000] + train/ActionL1Loss=0.2338 + throughput/total_tokens=14,208,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=75/500000] + train/ActionL1Loss=0.2287 + throughput/total_tokens=14,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=76/500000] + train/ActionL1Loss=0.2439 + throughput/total_tokens=14,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=77/500000] + train/ActionL1Loss=0.2083 + throughput/total_tokens=14,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=78/500000] + train/ActionL1Loss=0.2782 + throughput/total_tokens=14,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=79/500000] + train/ActionL1Loss=0.3028 + throughput/total_tokens=15,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=80/500000] + optim/total_grad_norm=19.70 + train/ActionL1Loss=0.2559 + throughput/total_tokens=15,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=81/500000] + train/ActionL1Loss=0.2359 + throughput/total_tokens=15,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=82/500000] + train/ActionL1Loss=0.2536 + throughput/total_tokens=15,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=83/500000] + train/ActionL1Loss=0.2748 + throughput/total_tokens=15,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=84/500000] + train/ActionL1Loss=0.2230 + throughput/total_tokens=16,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=85/500000] + train/ActionL1Loss=0.2397 + throughput/total_tokens=16,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=86/500000] + train/ActionL1Loss=0.2507 + throughput/total_tokens=16,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=87/500000] + train/ActionL1Loss=0.2094 + throughput/total_tokens=16,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=88/500000] + train/ActionL1Loss=0.2115 + throughput/total_tokens=16,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=89/500000] + train/ActionL1Loss=0.1963 + throughput/total_tokens=17,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=90/500000] + train/ActionL1Loss=0.2155 + throughput/total_tokens=17,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=91/500000] + train/ActionL1Loss=0.2281 + throughput/total_tokens=17,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=92/500000] + train/ActionL1Loss=0.2364 + throughput/total_tokens=17,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=93/500000] + train/ActionL1Loss=0.2110 + throughput/total_tokens=17,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=94/500000] + train/ActionL1Loss=0.1941 + throughput/total_tokens=18,048,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=95/500000] + train/ActionL1Loss=0.1911 + throughput/total_tokens=18,240,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=96/500000] + train/ActionL1Loss=0.1907 + throughput/total_tokens=18,432,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=97/500000] + train/ActionL1Loss=0.1833 + throughput/total_tokens=18,624,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=98/500000] + train/ActionL1Loss=0.2025 + throughput/total_tokens=18,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=99/500000] + train/ActionL1Loss=0.2037 + throughput/total_tokens=19,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=100/500000] + optim/total_grad_norm=16.55 + train/ActionL1Loss=0.1965 + throughput/total_tokens=19,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=101/500000] + train/ActionL1Loss=0.2040 + throughput/total_tokens=19,392,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=102/500000] + train/ActionL1Loss=0.2074 + throughput/total_tokens=19,584,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=103/500000] + train/ActionL1Loss=0.2018 + throughput/total_tokens=19,776,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=104/500000] + train/ActionL1Loss=0.2015 + throughput/total_tokens=19,968,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=105/500000] + train/ActionL1Loss=0.2192 + throughput/total_tokens=20,160,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=106/500000] + train/ActionL1Loss=0.1984 + throughput/total_tokens=20,352,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=107/500000] + train/ActionL1Loss=0.2214 + throughput/total_tokens=20,544,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=108/500000] + train/ActionL1Loss=0.2033 + throughput/total_tokens=20,736,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=109/500000] + train/ActionL1Loss=0.2141 + throughput/total_tokens=20,928,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=110/500000] + train/ActionL1Loss=0.2136 + throughput/total_tokens=21,120,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=111/500000] + train/ActionL1Loss=0.2100 + throughput/total_tokens=21,312,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=112/500000] + train/ActionL1Loss=0.2023 + throughput/total_tokens=21,504,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=113/500000] + train/ActionL1Loss=0.1877 + throughput/total_tokens=21,696,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=114/500000] + train/ActionL1Loss=0.1921 + throughput/total_tokens=21,888,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=115/500000] + train/ActionL1Loss=0.1931 + throughput/total_tokens=22,080,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=116/500000] + train/ActionL1Loss=0.1967 + throughput/total_tokens=22,272,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=117/500000] + train/ActionL1Loss=0.1702 + throughput/total_tokens=22,464,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=118/500000] + train/ActionL1Loss=0.1755 + throughput/total_tokens=22,656,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=119/500000] + train/ActionL1Loss=0.1890 + throughput/total_tokens=22,848,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=120/500000] + optim/total_grad_norm=20.86 + train/ActionL1Loss=0.1871 + throughput/total_tokens=23,040,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=121/500000] + train/ActionL1Loss=0.2069 + throughput/total_tokens=23,232,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=122/500000] + train/ActionL1Loss=0.1675 + throughput/total_tokens=23,424,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=123/500000] + train/ActionL1Loss=0.1850 + throughput/total_tokens=23,616,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=124/500000] + train/ActionL1Loss=0.1881 + throughput/total_tokens=23,808,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=125/500000] + train/ActionL1Loss=0.1656 + throughput/total_tokens=24,000,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=126/500000] + train/ActionL1Loss=0.1923 + throughput/total_tokens=24,192,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=127/500000] + train/ActionL1Loss=0.1957 + throughput/total_tokens=24,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=128/500000] + train/ActionL1Loss=0.1908 + throughput/total_tokens=24,576,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=129/500000] + train/ActionL1Loss=0.1928 + throughput/total_tokens=24,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=130/500000] + train/ActionL1Loss=0.1703 + throughput/total_tokens=24,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=131/500000] + train/ActionL1Loss=0.1718 + throughput/total_tokens=25,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=132/500000] + train/ActionL1Loss=0.1656 + throughput/total_tokens=25,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=133/500000] + train/ActionL1Loss=0.1696 + throughput/total_tokens=25,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=134/500000] + train/ActionL1Loss=0.1618 + throughput/total_tokens=25,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=135/500000] + train/ActionL1Loss=0.1704 + throughput/total_tokens=25,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=136/500000] + train/ActionL1Loss=0.1710 + throughput/total_tokens=26,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=137/500000] + train/ActionL1Loss=0.1633 + throughput/total_tokens=26,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=138/500000] + train/ActionL1Loss=0.1952 + throughput/total_tokens=26,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=139/500000] + train/ActionL1Loss=0.1538 + throughput/total_tokens=26,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=140/500000] + optim/total_grad_norm=20.37 + train/ActionL1Loss=0.1801 + throughput/total_tokens=26,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=141/500000] + train/ActionL1Loss=0.1855 + throughput/total_tokens=27,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=142/500000] + train/ActionL1Loss=0.1567 + throughput/total_tokens=27,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=143/500000] + train/ActionL1Loss=0.1607 + throughput/total_tokens=27,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=144/500000] + train/ActionL1Loss=0.1611 + throughput/total_tokens=27,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=145/500000] + train/ActionL1Loss=0.1599 + throughput/total_tokens=27,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=146/500000] + train/ActionL1Loss=0.1650 + throughput/total_tokens=28,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=147/500000] + train/ActionL1Loss=0.1726 + throughput/total_tokens=28,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=148/500000] + train/ActionL1Loss=0.1650 + throughput/total_tokens=28,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=149/500000] + train/ActionL1Loss=0.1722 + throughput/total_tokens=28,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=150/500000] + train/ActionL1Loss=0.1710 + throughput/total_tokens=28,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=151/500000] + train/ActionL1Loss=0.1650 + throughput/total_tokens=28,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=152/500000] + train/ActionL1Loss=0.1801 + throughput/total_tokens=29,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=153/500000] + train/ActionL1Loss=0.1778 + throughput/total_tokens=29,376,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=154/500000] + train/ActionL1Loss=0.1752 + throughput/total_tokens=29,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=155/500000] + train/ActionL1Loss=0.1650 + throughput/total_tokens=29,760,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=156/500000] + train/ActionL1Loss=0.1663 + throughput/total_tokens=29,952,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=157/500000] + train/ActionL1Loss=0.1650 + throughput/total_tokens=30,144,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=158/500000] + train/ActionL1Loss=0.1611 + throughput/total_tokens=30,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=159/500000] + train/ActionL1Loss=0.1649 + throughput/total_tokens=30,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=160/500000] + optim/total_grad_norm=14.83 + train/ActionL1Loss=0.1519 + throughput/total_tokens=30,720,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=161/500000] + train/ActionL1Loss=0.1632 + throughput/total_tokens=30,912,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=162/500000] + train/ActionL1Loss=0.1706 + throughput/total_tokens=31,104,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=163/500000] + train/ActionL1Loss=0.1544 + throughput/total_tokens=31,296,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=164/500000] + train/ActionL1Loss=0.1645 + throughput/total_tokens=31,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=165/500000] + train/ActionL1Loss=0.1474 + throughput/total_tokens=31,680,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=166/500000] + train/ActionL1Loss=0.1605 + throughput/total_tokens=31,872,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=167/500000] + train/ActionL1Loss=0.1563 + throughput/total_tokens=32,064,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=168/500000] + train/ActionL1Loss=0.1560 + throughput/total_tokens=32,256,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=169/500000] + train/ActionL1Loss=0.1664 + throughput/total_tokens=32,448,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=170/500000] + train/ActionL1Loss=0.1600 + throughput/total_tokens=32,640,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=171/500000] + train/ActionL1Loss=0.1549 + throughput/total_tokens=32,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=172/500000] + train/ActionL1Loss=0.1448 + throughput/total_tokens=33,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=173/500000] + train/ActionL1Loss=0.1456 + throughput/total_tokens=33,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=174/500000] + train/ActionL1Loss=0.1485 + throughput/total_tokens=33,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=175/500000] + train/ActionL1Loss=0.1512 + throughput/total_tokens=33,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=176/500000] + train/ActionL1Loss=0.1417 + throughput/total_tokens=33,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=177/500000] + train/ActionL1Loss=0.1542 + throughput/total_tokens=33,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=178/500000] + train/ActionL1Loss=0.1469 + throughput/total_tokens=34,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=179/500000] + train/ActionL1Loss=0.1560 + throughput/total_tokens=34,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=180/500000] + optim/total_grad_norm=21.65 + train/ActionL1Loss=0.1698 + throughput/total_tokens=34,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=181/500000] + train/ActionL1Loss=0.1420 + throughput/total_tokens=34,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=182/500000] + train/ActionL1Loss=0.1453 + throughput/total_tokens=34,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=183/500000] + train/ActionL1Loss=0.1382 + throughput/total_tokens=35,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=184/500000] + train/ActionL1Loss=0.1492 + throughput/total_tokens=35,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=185/500000] + train/ActionL1Loss=0.1497 + throughput/total_tokens=35,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=186/500000] + train/ActionL1Loss=0.1269 + throughput/total_tokens=35,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=187/500000] + train/ActionL1Loss=0.1420 + throughput/total_tokens=35,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=188/500000] + train/ActionL1Loss=0.1390 + throughput/total_tokens=36,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=189/500000] + train/ActionL1Loss=0.1384 + throughput/total_tokens=36,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=190/500000] + train/ActionL1Loss=0.1459 + throughput/total_tokens=36,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=191/500000] + train/ActionL1Loss=0.1492 + throughput/total_tokens=36,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=192/500000] + train/ActionL1Loss=0.1339 + throughput/total_tokens=36,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=193/500000] + train/ActionL1Loss=0.1347 + throughput/total_tokens=37,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=194/500000] + train/ActionL1Loss=0.1347 + throughput/total_tokens=37,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=195/500000] + train/ActionL1Loss=0.1304 + throughput/total_tokens=37,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=196/500000] + train/ActionL1Loss=0.1386 + throughput/total_tokens=37,632,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=197/500000] + train/ActionL1Loss=0.1339 + throughput/total_tokens=37,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=198/500000] + train/ActionL1Loss=0.1438 + throughput/total_tokens=38,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=199/500000] + train/ActionL1Loss=0.1355 + throughput/total_tokens=38,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=200/500000] + optim/total_grad_norm=15.30 + train/ActionL1Loss=0.1480 + throughput/total_tokens=38,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=201/500000] + train/ActionL1Loss=0.1397 + throughput/total_tokens=38,592,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=202/500000] + train/ActionL1Loss=0.1426 + throughput/total_tokens=38,784,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=203/500000] + train/ActionL1Loss=0.1330 + throughput/total_tokens=38,976,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=204/500000] + train/ActionL1Loss=0.1385 + throughput/total_tokens=39,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=205/500000] + train/ActionL1Loss=0.1340 + throughput/total_tokens=39,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=206/500000] + train/ActionL1Loss=0.1248 + throughput/total_tokens=39,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=207/500000] + train/ActionL1Loss=0.1424 + throughput/total_tokens=39,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=208/500000] + train/ActionL1Loss=0.1302 + throughput/total_tokens=39,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=209/500000] + train/ActionL1Loss=0.1369 + throughput/total_tokens=40,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=210/500000] + train/ActionL1Loss=0.1316 + throughput/total_tokens=40,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=211/500000] + train/ActionL1Loss=0.1308 + throughput/total_tokens=40,512,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=212/500000] + train/ActionL1Loss=0.1371 + throughput/total_tokens=40,704,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=213/500000] + train/ActionL1Loss=0.1447 + throughput/total_tokens=40,896,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=214/500000] + train/ActionL1Loss=0.1348 + throughput/total_tokens=41,088,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=215/500000] + train/ActionL1Loss=0.1230 + throughput/total_tokens=41,280,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=216/500000] + train/ActionL1Loss=0.1275 + throughput/total_tokens=41,472,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=217/500000] + train/ActionL1Loss=0.1374 + throughput/total_tokens=41,664,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=218/500000] + train/ActionL1Loss=0.1280 + throughput/total_tokens=41,856,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=219/500000] + train/ActionL1Loss=0.1347 + throughput/total_tokens=42,048,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=220/500000] + optim/total_grad_norm=20.02 + train/ActionL1Loss=0.1404 + throughput/total_tokens=42,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=221/500000] + train/ActionL1Loss=0.1304 + throughput/total_tokens=42,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=222/500000] + train/ActionL1Loss=0.1294 + throughput/total_tokens=42,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=223/500000] + train/ActionL1Loss=0.1486 + throughput/total_tokens=42,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=224/500000] + train/ActionL1Loss=0.1186 + throughput/total_tokens=43,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=225/500000] + train/ActionL1Loss=0.1386 + throughput/total_tokens=43,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=226/500000] + train/ActionL1Loss=0.1456 + throughput/total_tokens=43,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=227/500000] + train/ActionL1Loss=0.1369 + throughput/total_tokens=43,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=228/500000] + train/ActionL1Loss=0.1365 + throughput/total_tokens=43,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=229/500000] + train/ActionL1Loss=0.1419 + throughput/total_tokens=43,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=230/500000] + train/ActionL1Loss=0.1342 + throughput/total_tokens=44,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=231/500000] + train/ActionL1Loss=0.1341 + throughput/total_tokens=44,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=232/500000] + train/ActionL1Loss=0.1360 + throughput/total_tokens=44,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=233/500000] + train/ActionL1Loss=0.1332 + throughput/total_tokens=44,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=234/500000] + train/ActionL1Loss=0.1431 + throughput/total_tokens=44,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=235/500000] + train/ActionL1Loss=0.1446 + throughput/total_tokens=45,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=236/500000] + train/ActionL1Loss=0.1298 + throughput/total_tokens=45,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=237/500000] + train/ActionL1Loss=0.1313 + throughput/total_tokens=45,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=238/500000] + train/ActionL1Loss=0.1442 + throughput/total_tokens=45,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=239/500000] + train/ActionL1Loss=0.1537 + throughput/total_tokens=45,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=240/500000] + optim/total_grad_norm=23.66 + train/ActionL1Loss=0.1382 + throughput/total_tokens=46,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=241/500000] + train/ActionL1Loss=0.1368 + throughput/total_tokens=46,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=242/500000] + train/ActionL1Loss=0.1339 + throughput/total_tokens=46,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=243/500000] + train/ActionL1Loss=0.1411 + throughput/total_tokens=46,656,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=244/500000] + train/ActionL1Loss=0.1207 + throughput/total_tokens=46,848,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=245/500000] + train/ActionL1Loss=0.1373 + throughput/total_tokens=47,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=246/500000] + train/ActionL1Loss=0.1452 + throughput/total_tokens=47,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=247/500000] + train/ActionL1Loss=0.1275 + throughput/total_tokens=47,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=248/500000] + train/ActionL1Loss=0.1224 + throughput/total_tokens=47,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=249/500000] + train/ActionL1Loss=0.1223 + throughput/total_tokens=47,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=250/500000] + train/ActionL1Loss=0.1230 + throughput/total_tokens=48,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=251/500000] + train/ActionL1Loss=0.1156 + throughput/total_tokens=48,192,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=252/500000] + train/ActionL1Loss=0.1203 + throughput/total_tokens=48,384,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=253/500000] + train/ActionL1Loss=0.1292 + throughput/total_tokens=48,576,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=254/500000] + train/ActionL1Loss=0.1157 + throughput/total_tokens=48,768,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=255/500000] + train/ActionL1Loss=0.1340 + throughput/total_tokens=48,960,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=256/500000] + train/ActionL1Loss=0.1239 + throughput/total_tokens=49,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=257/500000] + train/ActionL1Loss=0.1194 + throughput/total_tokens=49,344,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=258/500000] + train/ActionL1Loss=0.1191 + throughput/total_tokens=49,536,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=259/500000] + train/ActionL1Loss=0.1205 + throughput/total_tokens=49,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=260/500000] + optim/total_grad_norm=17.94 + train/ActionL1Loss=0.1245 + throughput/total_tokens=49,920,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=261/500000] + train/ActionL1Loss=0.1391 + throughput/total_tokens=50,112,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=262/500000] + train/ActionL1Loss=0.1232 + throughput/total_tokens=50,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=263/500000] + train/ActionL1Loss=0.1320 + throughput/total_tokens=50,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=264/500000] + train/ActionL1Loss=0.1201 + throughput/total_tokens=50,688,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=265/500000] + train/ActionL1Loss=0.1300 + throughput/total_tokens=50,880,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=266/500000] + train/ActionL1Loss=0.1277 + throughput/total_tokens=51,072,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=267/500000] + train/ActionL1Loss=0.1250 + throughput/total_tokens=51,264,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=268/500000] + train/ActionL1Loss=0.1211 + throughput/total_tokens=51,456,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=269/500000] + train/ActionL1Loss=0.1200 + throughput/total_tokens=51,648,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=270/500000] + train/ActionL1Loss=0.1142 + throughput/total_tokens=51,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=271/500000] + train/ActionL1Loss=0.1149 + throughput/total_tokens=52,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=272/500000] + train/ActionL1Loss=0.1321 + throughput/total_tokens=52,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=273/500000] + train/ActionL1Loss=0.1253 + throughput/total_tokens=52,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=274/500000] + train/ActionL1Loss=0.1133 + throughput/total_tokens=52,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=275/500000] + train/ActionL1Loss=0.1202 + throughput/total_tokens=52,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=276/500000] + train/ActionL1Loss=0.1262 + throughput/total_tokens=52,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=277/500000] + train/ActionL1Loss=0.1457 + throughput/total_tokens=53,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=278/500000] + train/ActionL1Loss=0.1298 + throughput/total_tokens=53,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=279/500000] + train/ActionL1Loss=0.1251 + throughput/total_tokens=53,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=280/500000] + optim/total_grad_norm=19.82 + train/ActionL1Loss=0.1296 + throughput/total_tokens=53,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=281/500000] + train/ActionL1Loss=0.1376 + throughput/total_tokens=53,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=282/500000] + train/ActionL1Loss=0.1402 + throughput/total_tokens=54,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=283/500000] + train/ActionL1Loss=0.1284 + throughput/total_tokens=54,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=284/500000] + train/ActionL1Loss=0.1167 + throughput/total_tokens=54,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=285/500000] + train/ActionL1Loss=0.1142 + throughput/total_tokens=54,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=286/500000] + train/ActionL1Loss=0.1213 + throughput/total_tokens=54,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=287/500000] + train/ActionL1Loss=0.1195 + throughput/total_tokens=55,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=288/500000] + train/ActionL1Loss=0.1156 + throughput/total_tokens=55,296,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=289/500000] + train/ActionL1Loss=0.1299 + throughput/total_tokens=55,488,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=290/500000] + train/ActionL1Loss=0.1167 + throughput/total_tokens=55,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=291/500000] + train/ActionL1Loss=0.1123 + throughput/total_tokens=55,872,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=292/500000] + train/ActionL1Loss=0.1186 + throughput/total_tokens=56,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=293/500000] + train/ActionL1Loss=0.1366 + throughput/total_tokens=56,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=294/500000] + train/ActionL1Loss=0.1302 + throughput/total_tokens=56,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=295/500000] + train/ActionL1Loss=0.1301 + throughput/total_tokens=56,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=296/500000] + train/ActionL1Loss=0.1264 + throughput/total_tokens=56,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=297/500000] + train/ActionL1Loss=0.1248 + throughput/total_tokens=57,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=298/500000] + train/ActionL1Loss=0.1176 + throughput/total_tokens=57,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=299/500000] + train/ActionL1Loss=0.1191 + throughput/total_tokens=57,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=300/500000] + optim/total_grad_norm=22.15 + train/ActionL1Loss=0.1359 + throughput/total_tokens=57,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=301/500000] + train/ActionL1Loss=0.1237 + throughput/total_tokens=57,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=302/500000] + train/ActionL1Loss=0.1349 + throughput/total_tokens=57,984,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=303/500000] + train/ActionL1Loss=0.1329 + throughput/total_tokens=58,176,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=304/500000] + train/ActionL1Loss=0.1150 + throughput/total_tokens=58,368,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=305/500000] + train/ActionL1Loss=0.1297 + throughput/total_tokens=58,560,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=306/500000] + train/ActionL1Loss=0.1436 + throughput/total_tokens=58,752,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=307/500000] + train/ActionL1Loss=0.1356 + throughput/total_tokens=58,944,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=308/500000] + train/ActionL1Loss=0.1316 + throughput/total_tokens=59,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=309/500000] + train/ActionL1Loss=0.1251 + throughput/total_tokens=59,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=310/500000] + train/ActionL1Loss=0.1479 + throughput/total_tokens=59,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=311/500000] + train/ActionL1Loss=0.1301 + throughput/total_tokens=59,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=312/500000] + train/ActionL1Loss=0.1276 + throughput/total_tokens=59,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=313/500000] + train/ActionL1Loss=0.1304 + throughput/total_tokens=60,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=314/500000] + train/ActionL1Loss=0.1346 + throughput/total_tokens=60,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=315/500000] + train/ActionL1Loss=0.1319 + throughput/total_tokens=60,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=316/500000] + train/ActionL1Loss=0.1273 + throughput/total_tokens=60,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=317/500000] + train/ActionL1Loss=0.1406 + throughput/total_tokens=60,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=318/500000] + train/ActionL1Loss=0.1422 + throughput/total_tokens=61,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=319/500000] + train/ActionL1Loss=0.1378 + throughput/total_tokens=61,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=320/500000] + optim/total_grad_norm=19.95 + train/ActionL1Loss=0.1265 + throughput/total_tokens=61,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=321/500000] + train/ActionL1Loss=0.1261 + throughput/total_tokens=61,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=322/500000] + train/ActionL1Loss=0.1292 + throughput/total_tokens=61,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=323/500000] + train/ActionL1Loss=0.1510 + throughput/total_tokens=62,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=324/500000] + train/ActionL1Loss=0.1242 + throughput/total_tokens=62,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=325/500000] + train/ActionL1Loss=0.1334 + throughput/total_tokens=62,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=326/500000] + train/ActionL1Loss=0.1269 + throughput/total_tokens=62,592,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=327/500000] + train/ActionL1Loss=0.1299 + throughput/total_tokens=62,784,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=328/500000] + train/ActionL1Loss=0.1256 + throughput/total_tokens=62,976,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=329/500000] + train/ActionL1Loss=0.1343 + throughput/total_tokens=63,168,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=330/500000] + train/ActionL1Loss=0.1103 + throughput/total_tokens=63,360,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=331/500000] + train/ActionL1Loss=0.1395 + throughput/total_tokens=63,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=332/500000] + train/ActionL1Loss=0.1064 + throughput/total_tokens=63,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=333/500000] + train/ActionL1Loss=0.1206 + throughput/total_tokens=63,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=334/500000] + train/ActionL1Loss=0.1421 + throughput/total_tokens=64,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=335/500000] + train/ActionL1Loss=0.1447 + throughput/total_tokens=64,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=336/500000] + train/ActionL1Loss=0.1289 + throughput/total_tokens=64,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=337/500000] + train/ActionL1Loss=0.1301 + throughput/total_tokens=64,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=338/500000] + train/ActionL1Loss=0.1292 + throughput/total_tokens=64,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=339/500000] + train/ActionL1Loss=0.1307 + throughput/total_tokens=65,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=340/500000] + optim/total_grad_norm=15.78 + train/ActionL1Loss=0.1125 + throughput/total_tokens=65,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=341/500000] + train/ActionL1Loss=0.1321 + throughput/total_tokens=65,472,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=342/500000] + train/ActionL1Loss=0.1209 + throughput/total_tokens=65,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=343/500000] + train/ActionL1Loss=0.1241 + throughput/total_tokens=65,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=344/500000] + train/ActionL1Loss=0.1150 + throughput/total_tokens=66,048,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=345/500000] + train/ActionL1Loss=0.1281 + throughput/total_tokens=66,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=346/500000] + train/ActionL1Loss=0.1191 + throughput/total_tokens=66,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=347/500000] + train/ActionL1Loss=0.1313 + throughput/total_tokens=66,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=348/500000] + train/ActionL1Loss=0.1062 + throughput/total_tokens=66,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=349/500000] + train/ActionL1Loss=0.1081 + throughput/total_tokens=67,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=350/500000] + train/ActionL1Loss=0.1220 + throughput/total_tokens=67,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=351/500000] + train/ActionL1Loss=0.1166 + throughput/total_tokens=67,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=352/500000] + train/ActionL1Loss=0.1262 + throughput/total_tokens=67,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=353/500000] + train/ActionL1Loss=0.1324 + throughput/total_tokens=67,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=354/500000] + train/ActionL1Loss=0.1171 + throughput/total_tokens=67,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=355/500000] + train/ActionL1Loss=0.1129 + throughput/total_tokens=68,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=356/500000] + train/ActionL1Loss=0.1205 + throughput/total_tokens=68,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=357/500000] + train/ActionL1Loss=0.1095 + throughput/total_tokens=68,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=358/500000] + train/ActionL1Loss=0.1304 + throughput/total_tokens=68,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=359/500000] + train/ActionL1Loss=0.1221 + throughput/total_tokens=68,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=360/500000] + optim/total_grad_norm=18.64 + train/ActionL1Loss=0.1325 + throughput/total_tokens=69,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=361/500000] + train/ActionL1Loss=0.1135 + throughput/total_tokens=69,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=362/500000] + train/ActionL1Loss=0.1182 + throughput/total_tokens=69,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=363/500000] + train/ActionL1Loss=0.1128 + throughput/total_tokens=69,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=364/500000] + train/ActionL1Loss=0.1183 + throughput/total_tokens=69,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=365/500000] + train/ActionL1Loss=0.1222 + throughput/total_tokens=70,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=366/500000] + train/ActionL1Loss=0.1272 + throughput/total_tokens=70,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=367/500000] + train/ActionL1Loss=0.1088 + throughput/total_tokens=70,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=368/500000] + train/ActionL1Loss=0.1073 + throughput/total_tokens=70,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=369/500000] + train/ActionL1Loss=0.1373 + throughput/total_tokens=70,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=370/500000] + train/ActionL1Loss=0.1257 + throughput/total_tokens=71,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=371/500000] + train/ActionL1Loss=0.1209 + throughput/total_tokens=71,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=372/500000] + train/ActionL1Loss=0.1058 + throughput/total_tokens=71,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=373/500000] + train/ActionL1Loss=0.1278 + throughput/total_tokens=71,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=374/500000] + train/ActionL1Loss=0.1121 + throughput/total_tokens=71,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=375/500000] + train/ActionL1Loss=0.1091 + throughput/total_tokens=72,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=376/500000] + train/ActionL1Loss=0.1033 + throughput/total_tokens=72,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=377/500000] + train/ActionL1Loss=0.1182 + throughput/total_tokens=72,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=378/500000] + train/ActionL1Loss=0.1193 + throughput/total_tokens=72,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=379/500000] + train/ActionL1Loss=0.1153 + throughput/total_tokens=72,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=380/500000] + optim/total_grad_norm=17.95 + train/ActionL1Loss=0.1239 + throughput/total_tokens=72,960,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=381/500000] + train/ActionL1Loss=0.1233 + throughput/total_tokens=73,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=382/500000] + train/ActionL1Loss=0.1026 + throughput/total_tokens=73,344,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=383/500000] + train/ActionL1Loss=0.1242 + throughput/total_tokens=73,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=384/500000] + train/ActionL1Loss=0.1224 + throughput/total_tokens=73,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=385/500000] + train/ActionL1Loss=0.1048 + throughput/total_tokens=73,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=386/500000] + train/ActionL1Loss=0.1308 + throughput/total_tokens=74,112,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=387/500000] + train/ActionL1Loss=0.1075 + throughput/total_tokens=74,304,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=388/500000] + train/ActionL1Loss=0.1159 + throughput/total_tokens=74,496,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=389/500000] + train/ActionL1Loss=0.1139 + throughput/total_tokens=74,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=390/500000] + train/ActionL1Loss=0.1076 + throughput/total_tokens=74,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=391/500000] + train/ActionL1Loss=0.0975 + throughput/total_tokens=75,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=392/500000] + train/ActionL1Loss=0.1024 + throughput/total_tokens=75,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=393/500000] + train/ActionL1Loss=0.0942 + throughput/total_tokens=75,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=394/500000] + train/ActionL1Loss=0.1081 + throughput/total_tokens=75,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=395/500000] + train/ActionL1Loss=0.1064 + throughput/total_tokens=75,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=396/500000] + train/ActionL1Loss=0.1057 + throughput/total_tokens=76,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=397/500000] + train/ActionL1Loss=0.1118 + throughput/total_tokens=76,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=398/500000] + train/ActionL1Loss=0.1108 + throughput/total_tokens=76,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=399/500000] + train/ActionL1Loss=0.1104 + throughput/total_tokens=76,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=400/500000] + optim/total_grad_norm=17.58 + train/ActionL1Loss=0.1107 + throughput/total_tokens=76,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=401/500000] + train/ActionL1Loss=0.1009 + throughput/total_tokens=76,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=402/500000] + train/ActionL1Loss=0.0981 + throughput/total_tokens=77,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=403/500000] + train/ActionL1Loss=0.1078 + throughput/total_tokens=77,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=404/500000] + train/ActionL1Loss=0.1016 + throughput/total_tokens=77,568,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=405/500000] + train/ActionL1Loss=0.1114 + throughput/total_tokens=77,760,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=406/500000] + train/ActionL1Loss=0.1011 + throughput/total_tokens=77,952,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=407/500000] + train/ActionL1Loss=0.0923 + throughput/total_tokens=78,144,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=408/500000] + train/ActionL1Loss=0.1015 + throughput/total_tokens=78,336,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=409/500000] + train/ActionL1Loss=0.1003 + throughput/total_tokens=78,528,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=410/500000] + train/ActionL1Loss=0.1169 + throughput/total_tokens=78,720,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=411/500000] + train/ActionL1Loss=0.1079 + throughput/total_tokens=78,912,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=412/500000] + train/ActionL1Loss=0.1002 + throughput/total_tokens=79,104,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=413/500000] + train/ActionL1Loss=0.1155 + throughput/total_tokens=79,296,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=414/500000] + train/ActionL1Loss=0.0994 + throughput/total_tokens=79,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=415/500000] + train/ActionL1Loss=0.1047 + throughput/total_tokens=79,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=416/500000] + train/ActionL1Loss=0.1063 + throughput/total_tokens=79,872,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=417/500000] + train/ActionL1Loss=0.1140 + throughput/total_tokens=80,064,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=418/500000] + train/ActionL1Loss=0.1181 + throughput/total_tokens=80,256,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=419/500000] + train/ActionL1Loss=0.0931 + throughput/total_tokens=80,448,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=420/500000] + optim/total_grad_norm=16.60 + train/ActionL1Loss=0.1036 + throughput/total_tokens=80,640,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=421/500000] + train/ActionL1Loss=0.1071 + throughput/total_tokens=80,832,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=422/500000] + train/ActionL1Loss=0.1145 + throughput/total_tokens=81,024,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=423/500000] + train/ActionL1Loss=0.1040 + throughput/total_tokens=81,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=424/500000] + train/ActionL1Loss=0.0989 + throughput/total_tokens=81,408,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=425/500000] + train/ActionL1Loss=0.0996 + throughput/total_tokens=81,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=426/500000] + train/ActionL1Loss=0.0854 + throughput/total_tokens=81,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=427/500000] + train/ActionL1Loss=0.1067 + throughput/total_tokens=81,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=428/500000] + train/ActionL1Loss=0.0997 + throughput/total_tokens=82,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=429/500000] + train/ActionL1Loss=0.1079 + throughput/total_tokens=82,368,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=430/500000] + train/ActionL1Loss=0.1174 + throughput/total_tokens=82,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=431/500000] + train/ActionL1Loss=0.1255 + throughput/total_tokens=82,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=432/500000] + train/ActionL1Loss=0.1135 + throughput/total_tokens=82,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=433/500000] + train/ActionL1Loss=0.1156 + throughput/total_tokens=83,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=434/500000] + train/ActionL1Loss=0.1209 + throughput/total_tokens=83,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=435/500000] + train/ActionL1Loss=0.1097 + throughput/total_tokens=83,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=436/500000] + train/ActionL1Loss=0.1028 + throughput/total_tokens=83,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=437/500000] + train/ActionL1Loss=0.1047 + throughput/total_tokens=83,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=438/500000] + train/ActionL1Loss=0.1213 + throughput/total_tokens=84,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=439/500000] + train/ActionL1Loss=0.1096 + throughput/total_tokens=84,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=440/500000] + optim/total_grad_norm=20.46 + train/ActionL1Loss=0.1065 + throughput/total_tokens=84,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=441/500000] + train/ActionL1Loss=0.1242 + throughput/total_tokens=84,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=442/500000] + train/ActionL1Loss=0.1248 + throughput/total_tokens=84,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=443/500000] + train/ActionL1Loss=0.1094 + throughput/total_tokens=85,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=444/500000] + train/ActionL1Loss=0.1172 + throughput/total_tokens=85,248,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=445/500000] + train/ActionL1Loss=0.1258 + throughput/total_tokens=85,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=446/500000] + train/ActionL1Loss=0.1247 + throughput/total_tokens=85,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=447/500000] + train/ActionL1Loss=0.1212 + throughput/total_tokens=85,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=448/500000] + train/ActionL1Loss=0.1072 + throughput/total_tokens=86,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=449/500000] + train/ActionL1Loss=0.1144 + throughput/total_tokens=86,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=450/500000] + train/ActionL1Loss=0.1220 + throughput/total_tokens=86,400,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=451/500000] + train/ActionL1Loss=0.0976 + throughput/total_tokens=86,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=452/500000] + train/ActionL1Loss=0.1229 + throughput/total_tokens=86,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=453/500000] + train/ActionL1Loss=0.1163 + throughput/total_tokens=86,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=454/500000] + train/ActionL1Loss=0.1282 + throughput/total_tokens=87,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=455/500000] + train/ActionL1Loss=0.1225 + throughput/total_tokens=87,360,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=456/500000] + train/ActionL1Loss=0.1145 + throughput/total_tokens=87,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=457/500000] + train/ActionL1Loss=0.1077 + throughput/total_tokens=87,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=458/500000] + train/ActionL1Loss=0.1273 + throughput/total_tokens=87,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=459/500000] + train/ActionL1Loss=0.1185 + throughput/total_tokens=88,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=460/500000] + optim/total_grad_norm=16.45 + train/ActionL1Loss=0.1054 + throughput/total_tokens=88,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=461/500000] + train/ActionL1Loss=0.1036 + throughput/total_tokens=88,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=462/500000] + train/ActionL1Loss=0.1175 + throughput/total_tokens=88,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=463/500000] + train/ActionL1Loss=0.1066 + throughput/total_tokens=88,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=464/500000] + train/ActionL1Loss=0.1135 + throughput/total_tokens=89,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=465/500000] + train/ActionL1Loss=0.1265 + throughput/total_tokens=89,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=466/500000] + train/ActionL1Loss=0.1171 + throughput/total_tokens=89,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=467/500000] + train/ActionL1Loss=0.1072 + throughput/total_tokens=89,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=468/500000] + train/ActionL1Loss=0.1123 + throughput/total_tokens=89,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=469/500000] + train/ActionL1Loss=0.1224 + throughput/total_tokens=90,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=470/500000] + train/ActionL1Loss=0.1174 + throughput/total_tokens=90,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=471/500000] + train/ActionL1Loss=0.1062 + throughput/total_tokens=90,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=472/500000] + train/ActionL1Loss=0.1187 + throughput/total_tokens=90,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=473/500000] + train/ActionL1Loss=0.1197 + throughput/total_tokens=90,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=474/500000] + train/ActionL1Loss=0.1065 + throughput/total_tokens=91,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=475/500000] + train/ActionL1Loss=0.1089 + throughput/total_tokens=91,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=476/500000] + train/ActionL1Loss=0.1183 + throughput/total_tokens=91,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=477/500000] + train/ActionL1Loss=0.1190 + throughput/total_tokens=91,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=478/500000] + train/ActionL1Loss=0.1148 + throughput/total_tokens=91,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=479/500000] + train/ActionL1Loss=0.1216 + throughput/total_tokens=91,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=480/500000] + optim/total_grad_norm=18.33 + train/ActionL1Loss=0.1303 + throughput/total_tokens=92,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=481/500000] + train/ActionL1Loss=0.1116 + throughput/total_tokens=92,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=482/500000] + train/ActionL1Loss=0.0936 + throughput/total_tokens=92,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=483/500000] + train/ActionL1Loss=0.1194 + throughput/total_tokens=92,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=484/500000] + train/ActionL1Loss=0.1303 + throughput/total_tokens=92,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=485/500000] + train/ActionL1Loss=0.1193 + throughput/total_tokens=93,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=486/500000] + train/ActionL1Loss=0.1125 + throughput/total_tokens=93,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=487/500000] + train/ActionL1Loss=0.1197 + throughput/total_tokens=93,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=488/500000] + train/ActionL1Loss=0.1182 + throughput/total_tokens=93,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=489/500000] + train/ActionL1Loss=0.1284 + throughput/total_tokens=93,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=490/500000] + train/ActionL1Loss=0.1120 + throughput/total_tokens=94,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=491/500000] + train/ActionL1Loss=0.1172 + throughput/total_tokens=94,272,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=492/500000] + train/ActionL1Loss=0.0965 + throughput/total_tokens=94,464,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=493/500000] + train/ActionL1Loss=0.1040 + throughput/total_tokens=94,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=494/500000] + train/ActionL1Loss=0.1139 + throughput/total_tokens=94,848,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=495/500000] + train/ActionL1Loss=0.1107 + throughput/total_tokens=95,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=496/500000] + train/ActionL1Loss=0.1161 + throughput/total_tokens=95,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=497/500000] + train/ActionL1Loss=0.1351 + throughput/total_tokens=95,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=498/500000] + train/ActionL1Loss=0.1214 + throughput/total_tokens=95,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=499/500000] + train/ActionL1Loss=0.0964 + throughput/total_tokens=95,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=500/500000] + optim/total_grad_norm=18.95 + train/ActionL1Loss=0.1110 + throughput/total_tokens=96,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/11 [19:31:14] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/fully_sharded_data_parallel.py:678: warnings.py:109 + FutureWarning: FSDP.state_dict_type() and FSDP.set_state_dict_type() are being deprecated. Please use APIs, get_state_dict() and + set_state_dict(), which can support different parallelisms, FSDP1, FSDP2, DDP. API doc: + https://pytorch.org/docs/stable/distributed.checkpoint.html#torch.distributed.checkpoint.state_dict.get_state_dict .Tutorial: + https://pytorch.org/tutorials/recipes/distributed_checkpoint_recipe.html . + warnings.warn( + + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/distributed_c10d.py:860: UserWarning: warnings.py:109 + `_get_pg_default_device` will be deprecated, it only stays for backward-compatiblity reason. If you need to find a device for object + collectives, please use `_get_object_coll_device`. If you need to query the device types supported by group, please use + `_device_capability(group)`. + warnings.warn( + +10/11 [19:31:16] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:722: FutureWarning: warnings.py:109 + Please use DTensor instead and we are deprecating ShardedTensor. + local_shape = tensor.shape + + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:739: FutureWarning: warnings.py:109 + Please use DTensor instead and we are deprecating ShardedTensor. + tensor.shape, + + WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/distributed/fsdp/_state_dict_utils.py:741: FutureWarning: warnings.py:109 + Please use DTensor instead and we are deprecating ShardedTensor. + tensor.dtype, + +10/11 [19:31:20] WARNING | >> /vast/users/xiaodan/miniconda3/envs/a1/lib/python3.10/site-packages/torch/overrides.py:1747: FutureWarning: Please use DTensor warnings.py:109 + instead and we are deprecating ShardedTensor. + result = torch_func_method(public_api, types, args, kwargs) + +10/11 [19:31:49] INFO | >> Saving config... checkpoint.py:608 +10/11 [19:32:27] INFO | >> Saving model state... checkpoint.py:796 +10/11 [19:33:39] INFO | >> Saving optim state... checkpoint.py:811 +10/11 [19:35:10] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=501/500000] + train/ActionL1Loss=0.1109 + throughput/total_tokens=96,192,000 + throughput/device/tokens_per_second=1,209 + throughput/device/batches_per_second=0.0504 +[step=502/500000] + train/ActionL1Loss=0.0986 + throughput/total_tokens=96,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=503/500000] + train/ActionL1Loss=0.1063 + throughput/total_tokens=96,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=504/500000] + train/ActionL1Loss=0.1239 + throughput/total_tokens=96,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=505/500000] + train/ActionL1Loss=0.1196 + throughput/total_tokens=96,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=506/500000] + train/ActionL1Loss=0.1155 + throughput/total_tokens=97,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=507/500000] + train/ActionL1Loss=0.1163 + throughput/total_tokens=97,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=508/500000] + train/ActionL1Loss=0.0996 + throughput/total_tokens=97,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=509/500000] + train/ActionL1Loss=0.1282 + throughput/total_tokens=97,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=510/500000] + train/ActionL1Loss=0.1211 + throughput/total_tokens=97,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=511/500000] + train/ActionL1Loss=0.1155 + throughput/total_tokens=98,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=512/500000] + train/ActionL1Loss=0.1147 + throughput/total_tokens=98,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=513/500000] + train/ActionL1Loss=0.1169 + throughput/total_tokens=98,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=514/500000] + train/ActionL1Loss=0.1204 + throughput/total_tokens=98,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=515/500000] + train/ActionL1Loss=0.1139 + throughput/total_tokens=98,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=516/500000] + train/ActionL1Loss=0.1157 + throughput/total_tokens=99,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=517/500000] + train/ActionL1Loss=0.1098 + throughput/total_tokens=99,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=518/500000] + train/ActionL1Loss=0.1176 + throughput/total_tokens=99,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=519/500000] + train/ActionL1Loss=0.1232 + throughput/total_tokens=99,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=520/500000] + optim/total_grad_norm=16.56 + train/ActionL1Loss=0.1203 + throughput/total_tokens=99,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=521/500000] + train/ActionL1Loss=0.1183 + throughput/total_tokens=100,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=522/500000] + train/ActionL1Loss=0.1108 + throughput/total_tokens=100,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=523/500000] + train/ActionL1Loss=0.1219 + throughput/total_tokens=100,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=524/500000] + train/ActionL1Loss=0.1222 + throughput/total_tokens=100,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=525/500000] + train/ActionL1Loss=0.1180 + throughput/total_tokens=100,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=526/500000] + train/ActionL1Loss=0.1134 + throughput/total_tokens=100,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=527/500000] + train/ActionL1Loss=0.1188 + throughput/total_tokens=101,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=528/500000] + train/ActionL1Loss=0.1177 + throughput/total_tokens=101,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=529/500000] + train/ActionL1Loss=0.1259 + throughput/total_tokens=101,568,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=530/500000] + train/ActionL1Loss=0.1173 + throughput/total_tokens=101,760,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=531/500000] + train/ActionL1Loss=0.1063 + throughput/total_tokens=101,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=532/500000] + train/ActionL1Loss=0.1110 + throughput/total_tokens=102,144,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=533/500000] + train/ActionL1Loss=0.1106 + throughput/total_tokens=102,336,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=534/500000] + train/ActionL1Loss=0.1271 + throughput/total_tokens=102,528,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=535/500000] + train/ActionL1Loss=0.1050 + throughput/total_tokens=102,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=536/500000] + train/ActionL1Loss=0.1125 + throughput/total_tokens=102,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=537/500000] + train/ActionL1Loss=0.1039 + throughput/total_tokens=103,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=538/500000] + train/ActionL1Loss=0.1131 + throughput/total_tokens=103,296,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=539/500000] + train/ActionL1Loss=0.1103 + throughput/total_tokens=103,488,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=540/500000] + optim/total_grad_norm=15.98 + train/ActionL1Loss=0.1097 + throughput/total_tokens=103,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=541/500000] + train/ActionL1Loss=0.1041 + throughput/total_tokens=103,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=542/500000] + train/ActionL1Loss=0.1156 + throughput/total_tokens=104,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=543/500000] + train/ActionL1Loss=0.1015 + throughput/total_tokens=104,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=544/500000] + train/ActionL1Loss=0.0961 + throughput/total_tokens=104,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=545/500000] + train/ActionL1Loss=0.1121 + throughput/total_tokens=104,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=546/500000] + train/ActionL1Loss=0.1121 + throughput/total_tokens=104,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=547/500000] + train/ActionL1Loss=0.1112 + throughput/total_tokens=105,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=548/500000] + train/ActionL1Loss=0.1041 + throughput/total_tokens=105,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=549/500000] + train/ActionL1Loss=0.0951 + throughput/total_tokens=105,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=550/500000] + train/ActionL1Loss=0.0867 + throughput/total_tokens=105,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=551/500000] + train/ActionL1Loss=0.1024 + throughput/total_tokens=105,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=552/500000] + train/ActionL1Loss=0.1089 + throughput/total_tokens=105,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=553/500000] + train/ActionL1Loss=0.1193 + throughput/total_tokens=106,176,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=554/500000] + train/ActionL1Loss=0.1155 + throughput/total_tokens=106,368,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=555/500000] + train/ActionL1Loss=0.0959 + throughput/total_tokens=106,560,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=556/500000] + train/ActionL1Loss=0.1110 + throughput/total_tokens=106,752,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=557/500000] + train/ActionL1Loss=0.1083 + throughput/total_tokens=106,944,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=558/500000] + train/ActionL1Loss=0.1107 + throughput/total_tokens=107,136,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=559/500000] + train/ActionL1Loss=0.0980 + throughput/total_tokens=107,328,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=560/500000] + optim/total_grad_norm=15.92 + train/ActionL1Loss=0.1041 + throughput/total_tokens=107,520,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=561/500000] + train/ActionL1Loss=0.1129 + throughput/total_tokens=107,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=562/500000] + train/ActionL1Loss=0.0949 + throughput/total_tokens=107,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=563/500000] + train/ActionL1Loss=0.0915 + throughput/total_tokens=108,096,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=564/500000] + train/ActionL1Loss=0.0875 + throughput/total_tokens=108,288,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=565/500000] + train/ActionL1Loss=0.1023 + throughput/total_tokens=108,480,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=566/500000] + train/ActionL1Loss=0.1050 + throughput/total_tokens=108,672,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=567/500000] + train/ActionL1Loss=0.1233 + throughput/total_tokens=108,864,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=568/500000] + train/ActionL1Loss=0.1169 + throughput/total_tokens=109,056,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=569/500000] + train/ActionL1Loss=0.1158 + throughput/total_tokens=109,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=570/500000] + train/ActionL1Loss=0.1028 + throughput/total_tokens=109,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=571/500000] + train/ActionL1Loss=0.1237 + throughput/total_tokens=109,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=572/500000] + train/ActionL1Loss=0.1178 + throughput/total_tokens=109,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=573/500000] + train/ActionL1Loss=0.1189 + throughput/total_tokens=110,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=574/500000] + train/ActionL1Loss=0.1074 + throughput/total_tokens=110,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=575/500000] + train/ActionL1Loss=0.1293 + throughput/total_tokens=110,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=576/500000] + train/ActionL1Loss=0.1227 + throughput/total_tokens=110,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=577/500000] + train/ActionL1Loss=0.1009 + throughput/total_tokens=110,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=578/500000] + train/ActionL1Loss=0.1089 + throughput/total_tokens=110,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=579/500000] + train/ActionL1Loss=0.1097 + throughput/total_tokens=111,168,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=580/500000] + optim/total_grad_norm=18.10 + train/ActionL1Loss=0.1297 + throughput/total_tokens=111,360,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=581/500000] + train/ActionL1Loss=0.1100 + throughput/total_tokens=111,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=582/500000] + train/ActionL1Loss=0.1128 + throughput/total_tokens=111,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=583/500000] + train/ActionL1Loss=0.0962 + throughput/total_tokens=111,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=584/500000] + train/ActionL1Loss=0.1148 + throughput/total_tokens=112,128,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=585/500000] + train/ActionL1Loss=0.1104 + throughput/total_tokens=112,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=586/500000] + train/ActionL1Loss=0.1264 + throughput/total_tokens=112,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=587/500000] + train/ActionL1Loss=0.1166 + throughput/total_tokens=112,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=588/500000] + train/ActionL1Loss=0.1273 + throughput/total_tokens=112,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=589/500000] + train/ActionL1Loss=0.1218 + throughput/total_tokens=113,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=590/500000] + train/ActionL1Loss=0.1121 + throughput/total_tokens=113,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=591/500000] + train/ActionL1Loss=0.1188 + throughput/total_tokens=113,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=592/500000] + train/ActionL1Loss=0.1136 + throughput/total_tokens=113,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=593/500000] + train/ActionL1Loss=0.1006 + throughput/total_tokens=113,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=594/500000] + train/ActionL1Loss=0.1301 + throughput/total_tokens=114,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=595/500000] + train/ActionL1Loss=0.1237 + throughput/total_tokens=114,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=596/500000] + train/ActionL1Loss=0.1196 + throughput/total_tokens=114,432,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=597/500000] + train/ActionL1Loss=0.1207 + throughput/total_tokens=114,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=598/500000] + train/ActionL1Loss=0.1269 + throughput/total_tokens=114,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=599/500000] + train/ActionL1Loss=0.1130 + throughput/total_tokens=115,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=600/500000] + optim/total_grad_norm=16.94 + train/ActionL1Loss=0.1028 + throughput/total_tokens=115,200,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=601/500000] + train/ActionL1Loss=0.0923 + throughput/total_tokens=115,392,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=602/500000] + train/ActionL1Loss=0.0987 + throughput/total_tokens=115,584,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=603/500000] + train/ActionL1Loss=0.0913 + throughput/total_tokens=115,776,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=604/500000] + train/ActionL1Loss=0.0903 + throughput/total_tokens=115,968,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=605/500000] + train/ActionL1Loss=0.1105 + throughput/total_tokens=116,160,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=606/500000] + train/ActionL1Loss=0.0889 + throughput/total_tokens=116,352,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=607/500000] + train/ActionL1Loss=0.1144 + throughput/total_tokens=116,544,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=608/500000] + train/ActionL1Loss=0.1166 + throughput/total_tokens=116,736,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=609/500000] + train/ActionL1Loss=0.0973 + throughput/total_tokens=116,928,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=610/500000] + train/ActionL1Loss=0.1253 + throughput/total_tokens=117,120,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=611/500000] + train/ActionL1Loss=0.1270 + throughput/total_tokens=117,312,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=612/500000] + train/ActionL1Loss=0.1027 + throughput/total_tokens=117,504,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=613/500000] + train/ActionL1Loss=0.1014 + throughput/total_tokens=117,696,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=614/500000] + train/ActionL1Loss=0.1119 + throughput/total_tokens=117,888,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=615/500000] + train/ActionL1Loss=0.0901 + throughput/total_tokens=118,080,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=616/500000] + train/ActionL1Loss=0.1133 + throughput/total_tokens=118,272,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=617/500000] + train/ActionL1Loss=0.1136 + throughput/total_tokens=118,464,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=618/500000] + train/ActionL1Loss=0.1147 + throughput/total_tokens=118,656,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=619/500000] + train/ActionL1Loss=0.1144 + throughput/total_tokens=118,848,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=620/500000] + optim/total_grad_norm=14.77 + train/ActionL1Loss=0.1016 + throughput/total_tokens=119,040,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=621/500000] + train/ActionL1Loss=0.1047 + throughput/total_tokens=119,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=622/500000] + train/ActionL1Loss=0.1211 + throughput/total_tokens=119,424,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=623/500000] + train/ActionL1Loss=0.1146 + throughput/total_tokens=119,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=624/500000] + train/ActionL1Loss=0.1090 + throughput/total_tokens=119,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=625/500000] + train/ActionL1Loss=0.1168 + throughput/total_tokens=120,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=626/500000] + train/ActionL1Loss=0.1130 + throughput/total_tokens=120,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=627/500000] + train/ActionL1Loss=0.1155 + throughput/total_tokens=120,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=628/500000] + train/ActionL1Loss=0.0940 + throughput/total_tokens=120,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=629/500000] + train/ActionL1Loss=0.1021 + throughput/total_tokens=120,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=630/500000] + train/ActionL1Loss=0.1039 + throughput/total_tokens=120,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=631/500000] + train/ActionL1Loss=0.1037 + throughput/total_tokens=121,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=632/500000] + train/ActionL1Loss=0.1278 + throughput/total_tokens=121,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=633/500000] + train/ActionL1Loss=0.1218 + throughput/total_tokens=121,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=634/500000] + train/ActionL1Loss=0.0943 + throughput/total_tokens=121,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=635/500000] + train/ActionL1Loss=0.1142 + throughput/total_tokens=121,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=636/500000] + train/ActionL1Loss=0.1286 + throughput/total_tokens=122,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=637/500000] + train/ActionL1Loss=0.1029 + throughput/total_tokens=122,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=638/500000] + train/ActionL1Loss=0.1015 + throughput/total_tokens=122,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=639/500000] + train/ActionL1Loss=0.1227 + throughput/total_tokens=122,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=640/500000] + optim/total_grad_norm=15.35 + train/ActionL1Loss=0.1096 + throughput/total_tokens=122,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=641/500000] + train/ActionL1Loss=0.0961 + throughput/total_tokens=123,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=642/500000] + train/ActionL1Loss=0.1081 + throughput/total_tokens=123,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=643/500000] + train/ActionL1Loss=0.1138 + throughput/total_tokens=123,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=644/500000] + train/ActionL1Loss=0.1052 + throughput/total_tokens=123,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=645/500000] + train/ActionL1Loss=0.1045 + throughput/total_tokens=123,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=646/500000] + train/ActionL1Loss=0.1052 + throughput/total_tokens=124,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=647/500000] + train/ActionL1Loss=0.1019 + throughput/total_tokens=124,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=648/500000] + train/ActionL1Loss=0.1090 + throughput/total_tokens=124,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=649/500000] + train/ActionL1Loss=0.1015 + throughput/total_tokens=124,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=650/500000] + train/ActionL1Loss=0.0964 + throughput/total_tokens=124,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=651/500000] + train/ActionL1Loss=0.0902 + throughput/total_tokens=124,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=652/500000] + train/ActionL1Loss=0.1033 + throughput/total_tokens=125,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=653/500000] + train/ActionL1Loss=0.0945 + throughput/total_tokens=125,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=654/500000] + train/ActionL1Loss=0.0914 + throughput/total_tokens=125,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=655/500000] + train/ActionL1Loss=0.1065 + throughput/total_tokens=125,760,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=656/500000] + train/ActionL1Loss=0.0982 + throughput/total_tokens=125,952,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=657/500000] + train/ActionL1Loss=0.1016 + throughput/total_tokens=126,144,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=658/500000] + train/ActionL1Loss=0.1122 + throughput/total_tokens=126,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=659/500000] + train/ActionL1Loss=0.0989 + throughput/total_tokens=126,528,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=660/500000] + optim/total_grad_norm=14.47 + train/ActionL1Loss=0.0928 + throughput/total_tokens=126,720,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=661/500000] + train/ActionL1Loss=0.1208 + throughput/total_tokens=126,912,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=662/500000] + train/ActionL1Loss=0.1044 + throughput/total_tokens=127,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=663/500000] + train/ActionL1Loss=0.1088 + throughput/total_tokens=127,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=664/500000] + train/ActionL1Loss=0.1192 + throughput/total_tokens=127,488,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=665/500000] + train/ActionL1Loss=0.1113 + throughput/total_tokens=127,680,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=666/500000] + train/ActionL1Loss=0.1336 + throughput/total_tokens=127,872,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=667/500000] + train/ActionL1Loss=0.1195 + throughput/total_tokens=128,064,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=668/500000] + train/ActionL1Loss=0.1028 + throughput/total_tokens=128,256,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=669/500000] + train/ActionL1Loss=0.1079 + throughput/total_tokens=128,448,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=670/500000] + train/ActionL1Loss=0.1257 + throughput/total_tokens=128,640,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=671/500000] + train/ActionL1Loss=0.1122 + throughput/total_tokens=128,832,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=672/500000] + train/ActionL1Loss=0.0962 + throughput/total_tokens=129,024,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=673/500000] + train/ActionL1Loss=0.1108 + throughput/total_tokens=129,216,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=674/500000] + train/ActionL1Loss=0.1037 + throughput/total_tokens=129,408,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=675/500000] + train/ActionL1Loss=0.1264 + throughput/total_tokens=129,600,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=676/500000] + train/ActionL1Loss=0.0998 + throughput/total_tokens=129,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=677/500000] + train/ActionL1Loss=0.0956 + throughput/total_tokens=129,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=678/500000] + train/ActionL1Loss=0.1148 + throughput/total_tokens=130,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=679/500000] + train/ActionL1Loss=0.1291 + throughput/total_tokens=130,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=680/500000] + optim/total_grad_norm=13.53 + train/ActionL1Loss=0.0999 + throughput/total_tokens=130,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=681/500000] + train/ActionL1Loss=0.1048 + throughput/total_tokens=130,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=682/500000] + train/ActionL1Loss=0.0974 + throughput/total_tokens=130,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=683/500000] + train/ActionL1Loss=0.1129 + throughput/total_tokens=131,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=684/500000] + train/ActionL1Loss=0.1046 + throughput/total_tokens=131,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=685/500000] + train/ActionL1Loss=0.0985 + throughput/total_tokens=131,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=686/500000] + train/ActionL1Loss=0.1074 + throughput/total_tokens=131,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=687/500000] + train/ActionL1Loss=0.1026 + throughput/total_tokens=131,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=688/500000] + train/ActionL1Loss=0.1148 + throughput/total_tokens=132,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=689/500000] + train/ActionL1Loss=0.0971 + throughput/total_tokens=132,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=690/500000] + train/ActionL1Loss=0.1056 + throughput/total_tokens=132,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=691/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=132,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=692/500000] + train/ActionL1Loss=0.1033 + throughput/total_tokens=132,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=693/500000] + train/ActionL1Loss=0.1024 + throughput/total_tokens=133,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=694/500000] + train/ActionL1Loss=0.0946 + throughput/total_tokens=133,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=695/500000] + train/ActionL1Loss=0.0948 + throughput/total_tokens=133,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=696/500000] + train/ActionL1Loss=0.0971 + throughput/total_tokens=133,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=697/500000] + train/ActionL1Loss=0.1052 + throughput/total_tokens=133,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=698/500000] + train/ActionL1Loss=0.0987 + throughput/total_tokens=134,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=699/500000] + train/ActionL1Loss=0.1163 + throughput/total_tokens=134,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=700/500000] + optim/total_grad_norm=16.24 + train/ActionL1Loss=0.1027 + throughput/total_tokens=134,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=701/500000] + train/ActionL1Loss=0.1049 + throughput/total_tokens=134,592,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=702/500000] + train/ActionL1Loss=0.0983 + throughput/total_tokens=134,784,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=703/500000] + train/ActionL1Loss=0.0989 + throughput/total_tokens=134,976,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=704/500000] + train/ActionL1Loss=0.1224 + throughput/total_tokens=135,168,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=705/500000] + train/ActionL1Loss=0.1013 + throughput/total_tokens=135,360,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=706/500000] + train/ActionL1Loss=0.0962 + throughput/total_tokens=135,552,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=707/500000] + train/ActionL1Loss=0.0950 + throughput/total_tokens=135,744,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=708/500000] + train/ActionL1Loss=0.1130 + throughput/total_tokens=135,936,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=709/500000] + train/ActionL1Loss=0.1136 + throughput/total_tokens=136,128,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=710/500000] + train/ActionL1Loss=0.0913 + throughput/total_tokens=136,320,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=711/500000] + train/ActionL1Loss=0.1013 + throughput/total_tokens=136,512,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=712/500000] + train/ActionL1Loss=0.1149 + throughput/total_tokens=136,704,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=713/500000] + train/ActionL1Loss=0.1119 + throughput/total_tokens=136,896,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=714/500000] + train/ActionL1Loss=0.1098 + throughput/total_tokens=137,088,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=715/500000] + train/ActionL1Loss=0.0931 + throughput/total_tokens=137,280,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=716/500000] + train/ActionL1Loss=0.1176 + throughput/total_tokens=137,472,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=717/500000] + train/ActionL1Loss=0.1117 + throughput/total_tokens=137,664,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=718/500000] + train/ActionL1Loss=0.1072 + throughput/total_tokens=137,856,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=719/500000] + train/ActionL1Loss=0.1073 + throughput/total_tokens=138,048,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=720/500000] + optim/total_grad_norm=16.58 + train/ActionL1Loss=0.1109 + throughput/total_tokens=138,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=721/500000] + train/ActionL1Loss=0.1193 + throughput/total_tokens=138,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=722/500000] + train/ActionL1Loss=0.1022 + throughput/total_tokens=138,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=723/500000] + train/ActionL1Loss=0.1267 + throughput/total_tokens=138,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=724/500000] + train/ActionL1Loss=0.1110 + throughput/total_tokens=139,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=725/500000] + train/ActionL1Loss=0.1011 + throughput/total_tokens=139,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=726/500000] + train/ActionL1Loss=0.1020 + throughput/total_tokens=139,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=727/500000] + train/ActionL1Loss=0.1118 + throughput/total_tokens=139,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=728/500000] + train/ActionL1Loss=0.1112 + throughput/total_tokens=139,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=729/500000] + train/ActionL1Loss=0.1176 + throughput/total_tokens=139,968,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=730/500000] + train/ActionL1Loss=0.0914 + throughput/total_tokens=140,160,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=731/500000] + train/ActionL1Loss=0.0953 + throughput/total_tokens=140,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=732/500000] + train/ActionL1Loss=0.1002 + throughput/total_tokens=140,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=733/500000] + train/ActionL1Loss=0.0936 + throughput/total_tokens=140,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=734/500000] + train/ActionL1Loss=0.1006 + throughput/total_tokens=140,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=735/500000] + train/ActionL1Loss=0.1044 + throughput/total_tokens=141,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=736/500000] + train/ActionL1Loss=0.0955 + throughput/total_tokens=141,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=737/500000] + train/ActionL1Loss=0.0949 + throughput/total_tokens=141,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=738/500000] + train/ActionL1Loss=0.0834 + throughput/total_tokens=141,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=739/500000] + train/ActionL1Loss=0.1005 + throughput/total_tokens=141,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=740/500000] + optim/total_grad_norm=11.96 + train/ActionL1Loss=0.0983 + throughput/total_tokens=142,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=741/500000] + train/ActionL1Loss=0.0936 + throughput/total_tokens=142,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=742/500000] + train/ActionL1Loss=0.1042 + throughput/total_tokens=142,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=743/500000] + train/ActionL1Loss=0.1063 + throughput/total_tokens=142,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=744/500000] + train/ActionL1Loss=0.0908 + throughput/total_tokens=142,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=745/500000] + train/ActionL1Loss=0.1054 + throughput/total_tokens=143,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=746/500000] + train/ActionL1Loss=0.1056 + throughput/total_tokens=143,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=747/500000] + train/ActionL1Loss=0.0963 + throughput/total_tokens=143,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=748/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=143,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=749/500000] + train/ActionL1Loss=0.0983 + throughput/total_tokens=143,808,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=750/500000] + train/ActionL1Loss=0.1112 + throughput/total_tokens=144,000,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=751/500000] + train/ActionL1Loss=0.1011 + throughput/total_tokens=144,192,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=752/500000] + train/ActionL1Loss=0.0855 + throughput/total_tokens=144,384,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=753/500000] + train/ActionL1Loss=0.1056 + throughput/total_tokens=144,576,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=754/500000] + train/ActionL1Loss=0.0968 + throughput/total_tokens=144,768,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=755/500000] + train/ActionL1Loss=0.1042 + throughput/total_tokens=144,960,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=756/500000] + train/ActionL1Loss=0.1022 + throughput/total_tokens=145,152,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=757/500000] + train/ActionL1Loss=0.1006 + throughput/total_tokens=145,344,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=758/500000] + train/ActionL1Loss=0.1043 + throughput/total_tokens=145,536,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=759/500000] + train/ActionL1Loss=0.0980 + throughput/total_tokens=145,728,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=760/500000] + optim/total_grad_norm=14.93 + train/ActionL1Loss=0.1097 + throughput/total_tokens=145,920,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=761/500000] + train/ActionL1Loss=0.1031 + throughput/total_tokens=146,112,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=762/500000] + train/ActionL1Loss=0.1118 + throughput/total_tokens=146,304,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=763/500000] + train/ActionL1Loss=0.0996 + throughput/total_tokens=146,496,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=764/500000] + train/ActionL1Loss=0.0876 + throughput/total_tokens=146,688,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=765/500000] + train/ActionL1Loss=0.1029 + throughput/total_tokens=146,880,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=766/500000] + train/ActionL1Loss=0.0909 + throughput/total_tokens=147,072,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=767/500000] + train/ActionL1Loss=0.0830 + throughput/total_tokens=147,264,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=768/500000] + train/ActionL1Loss=0.0942 + throughput/total_tokens=147,456,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=769/500000] + train/ActionL1Loss=0.0937 + throughput/total_tokens=147,648,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=770/500000] + train/ActionL1Loss=0.0982 + throughput/total_tokens=147,840,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=771/500000] + train/ActionL1Loss=0.0931 + throughput/total_tokens=148,032,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=772/500000] + train/ActionL1Loss=0.0948 + throughput/total_tokens=148,224,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=773/500000] + train/ActionL1Loss=0.0971 + throughput/total_tokens=148,416,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=774/500000] + train/ActionL1Loss=0.0993 + throughput/total_tokens=148,608,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=775/500000] + train/ActionL1Loss=0.1026 + throughput/total_tokens=148,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=776/500000] + train/ActionL1Loss=0.1019 + throughput/total_tokens=148,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=777/500000] + train/ActionL1Loss=0.1175 + throughput/total_tokens=149,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=778/500000] + train/ActionL1Loss=0.1214 + throughput/total_tokens=149,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=779/500000] + train/ActionL1Loss=0.0964 + throughput/total_tokens=149,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=780/500000] + optim/total_grad_norm=12.62 + train/ActionL1Loss=0.1039 + throughput/total_tokens=149,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=781/500000] + train/ActionL1Loss=0.1068 + throughput/total_tokens=149,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=782/500000] + train/ActionL1Loss=0.1000 + throughput/total_tokens=150,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=783/500000] + train/ActionL1Loss=0.0852 + throughput/total_tokens=150,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=784/500000] + train/ActionL1Loss=0.0944 + throughput/total_tokens=150,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=785/500000] + train/ActionL1Loss=0.0880 + throughput/total_tokens=150,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=786/500000] + train/ActionL1Loss=0.0843 + throughput/total_tokens=150,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=787/500000] + train/ActionL1Loss=0.0951 + throughput/total_tokens=151,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=788/500000] + train/ActionL1Loss=0.1051 + throughput/total_tokens=151,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=789/500000] + train/ActionL1Loss=0.0995 + throughput/total_tokens=151,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=790/500000] + train/ActionL1Loss=0.0775 + throughput/total_tokens=151,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=791/500000] + train/ActionL1Loss=0.1025 + throughput/total_tokens=151,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=792/500000] + train/ActionL1Loss=0.0969 + throughput/total_tokens=152,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=793/500000] + train/ActionL1Loss=0.1135 + throughput/total_tokens=152,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=794/500000] + train/ActionL1Loss=0.1062 + throughput/total_tokens=152,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=795/500000] + train/ActionL1Loss=0.1101 + throughput/total_tokens=152,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=796/500000] + train/ActionL1Loss=0.1108 + throughput/total_tokens=152,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=797/500000] + train/ActionL1Loss=0.1034 + throughput/total_tokens=153,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=798/500000] + train/ActionL1Loss=0.1085 + throughput/total_tokens=153,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=799/500000] + train/ActionL1Loss=0.0794 + throughput/total_tokens=153,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=800/500000] + optim/total_grad_norm=13.44 + train/ActionL1Loss=0.0890 + throughput/total_tokens=153,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=801/500000] + train/ActionL1Loss=0.1063 + throughput/total_tokens=153,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=802/500000] + train/ActionL1Loss=0.1005 + throughput/total_tokens=153,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=803/500000] + train/ActionL1Loss=0.0980 + throughput/total_tokens=154,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=804/500000] + train/ActionL1Loss=0.0876 + throughput/total_tokens=154,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=805/500000] + train/ActionL1Loss=0.1121 + throughput/total_tokens=154,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=806/500000] + train/ActionL1Loss=0.0985 + throughput/total_tokens=154,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=807/500000] + train/ActionL1Loss=0.1085 + throughput/total_tokens=154,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=808/500000] + train/ActionL1Loss=0.1098 + throughput/total_tokens=155,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=809/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=155,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=810/500000] + train/ActionL1Loss=0.1136 + throughput/total_tokens=155,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=811/500000] + train/ActionL1Loss=0.1134 + throughput/total_tokens=155,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=812/500000] + train/ActionL1Loss=0.1096 + throughput/total_tokens=155,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=813/500000] + train/ActionL1Loss=0.0950 + throughput/total_tokens=156,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=814/500000] + train/ActionL1Loss=0.1074 + throughput/total_tokens=156,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=815/500000] + train/ActionL1Loss=0.1040 + throughput/total_tokens=156,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=816/500000] + train/ActionL1Loss=0.0966 + throughput/total_tokens=156,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=817/500000] + train/ActionL1Loss=0.0978 + throughput/total_tokens=156,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=818/500000] + train/ActionL1Loss=0.1008 + throughput/total_tokens=157,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=819/500000] + train/ActionL1Loss=0.0934 + throughput/total_tokens=157,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=820/500000] + optim/total_grad_norm=13.23 + train/ActionL1Loss=0.0848 + throughput/total_tokens=157,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=821/500000] + train/ActionL1Loss=0.0936 + throughput/total_tokens=157,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=822/500000] + train/ActionL1Loss=0.0985 + throughput/total_tokens=157,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=823/500000] + train/ActionL1Loss=0.0795 + throughput/total_tokens=158,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=824/500000] + train/ActionL1Loss=0.0854 + throughput/total_tokens=158,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=825/500000] + train/ActionL1Loss=0.0921 + throughput/total_tokens=158,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=826/500000] + train/ActionL1Loss=0.1044 + throughput/total_tokens=158,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=827/500000] + train/ActionL1Loss=0.0951 + throughput/total_tokens=158,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=828/500000] + train/ActionL1Loss=0.1046 + throughput/total_tokens=158,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=829/500000] + train/ActionL1Loss=0.0994 + throughput/total_tokens=159,168,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=830/500000] + train/ActionL1Loss=0.0959 + throughput/total_tokens=159,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=831/500000] + train/ActionL1Loss=0.1121 + throughput/total_tokens=159,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=832/500000] + train/ActionL1Loss=0.1189 + throughput/total_tokens=159,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=833/500000] + train/ActionL1Loss=0.1129 + throughput/total_tokens=159,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=834/500000] + train/ActionL1Loss=0.1026 + throughput/total_tokens=160,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=835/500000] + train/ActionL1Loss=0.1174 + throughput/total_tokens=160,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=836/500000] + train/ActionL1Loss=0.1118 + throughput/total_tokens=160,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=837/500000] + train/ActionL1Loss=0.0988 + throughput/total_tokens=160,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=838/500000] + train/ActionL1Loss=0.1071 + throughput/total_tokens=160,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=839/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=161,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=840/500000] + optim/total_grad_norm=13.46 + train/ActionL1Loss=0.0981 + throughput/total_tokens=161,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=841/500000] + train/ActionL1Loss=0.0946 + throughput/total_tokens=161,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=842/500000] + train/ActionL1Loss=0.0981 + throughput/total_tokens=161,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=843/500000] + train/ActionL1Loss=0.0917 + throughput/total_tokens=161,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=844/500000] + train/ActionL1Loss=0.0859 + throughput/total_tokens=162,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=845/500000] + train/ActionL1Loss=0.0878 + throughput/total_tokens=162,240,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=846/500000] + train/ActionL1Loss=0.1112 + throughput/total_tokens=162,432,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=847/500000] + train/ActionL1Loss=0.1066 + throughput/total_tokens=162,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=848/500000] + train/ActionL1Loss=0.0938 + throughput/total_tokens=162,816,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=849/500000] + train/ActionL1Loss=0.1101 + throughput/total_tokens=163,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=850/500000] + train/ActionL1Loss=0.1206 + throughput/total_tokens=163,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=851/500000] + train/ActionL1Loss=0.0759 + throughput/total_tokens=163,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=852/500000] + train/ActionL1Loss=0.1042 + throughput/total_tokens=163,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=853/500000] + train/ActionL1Loss=0.1114 + throughput/total_tokens=163,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=854/500000] + train/ActionL1Loss=0.0985 + throughput/total_tokens=163,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=855/500000] + train/ActionL1Loss=0.1006 + throughput/total_tokens=164,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=856/500000] + train/ActionL1Loss=0.0917 + throughput/total_tokens=164,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=857/500000] + train/ActionL1Loss=0.0846 + throughput/total_tokens=164,544,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=858/500000] + train/ActionL1Loss=0.0980 + throughput/total_tokens=164,736,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=859/500000] + train/ActionL1Loss=0.0981 + throughput/total_tokens=164,928,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=860/500000] + optim/total_grad_norm=12.43 + train/ActionL1Loss=0.0918 + throughput/total_tokens=165,120,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=861/500000] + train/ActionL1Loss=0.0812 + throughput/total_tokens=165,312,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=862/500000] + train/ActionL1Loss=0.1052 + throughput/total_tokens=165,504,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=863/500000] + train/ActionL1Loss=0.0956 + throughput/total_tokens=165,696,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=864/500000] + train/ActionL1Loss=0.0862 + throughput/total_tokens=165,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=865/500000] + train/ActionL1Loss=0.0819 + throughput/total_tokens=166,080,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=866/500000] + train/ActionL1Loss=0.1099 + throughput/total_tokens=166,272,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=867/500000] + train/ActionL1Loss=0.1063 + throughput/total_tokens=166,464,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=868/500000] + train/ActionL1Loss=0.0857 + throughput/total_tokens=166,656,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=869/500000] + train/ActionL1Loss=0.0869 + throughput/total_tokens=166,848,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=870/500000] + train/ActionL1Loss=0.1150 + throughput/total_tokens=167,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=871/500000] + train/ActionL1Loss=0.1050 + throughput/total_tokens=167,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=872/500000] + train/ActionL1Loss=0.1032 + throughput/total_tokens=167,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=873/500000] + train/ActionL1Loss=0.1050 + throughput/total_tokens=167,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=874/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=167,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=875/500000] + train/ActionL1Loss=0.0916 + throughput/total_tokens=168,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=876/500000] + train/ActionL1Loss=0.0971 + throughput/total_tokens=168,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=877/500000] + train/ActionL1Loss=0.1044 + throughput/total_tokens=168,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=878/500000] + train/ActionL1Loss=0.1069 + throughput/total_tokens=168,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=879/500000] + train/ActionL1Loss=0.0912 + throughput/total_tokens=168,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=880/500000] + optim/total_grad_norm=12.88 + train/ActionL1Loss=0.0992 + throughput/total_tokens=168,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=881/500000] + train/ActionL1Loss=0.1002 + throughput/total_tokens=169,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=882/500000] + train/ActionL1Loss=0.1058 + throughput/total_tokens=169,344,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=883/500000] + train/ActionL1Loss=0.0926 + throughput/total_tokens=169,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=884/500000] + train/ActionL1Loss=0.0941 + throughput/total_tokens=169,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=885/500000] + train/ActionL1Loss=0.1032 + throughput/total_tokens=169,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=886/500000] + train/ActionL1Loss=0.0978 + throughput/total_tokens=170,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=887/500000] + train/ActionL1Loss=0.0984 + throughput/total_tokens=170,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=888/500000] + train/ActionL1Loss=0.1032 + throughput/total_tokens=170,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=889/500000] + train/ActionL1Loss=0.0948 + throughput/total_tokens=170,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=890/500000] + train/ActionL1Loss=0.0885 + throughput/total_tokens=170,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=891/500000] + train/ActionL1Loss=0.1221 + throughput/total_tokens=171,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=892/500000] + train/ActionL1Loss=0.1158 + throughput/total_tokens=171,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=893/500000] + train/ActionL1Loss=0.1192 + throughput/total_tokens=171,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=894/500000] + train/ActionL1Loss=0.1128 + throughput/total_tokens=171,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=895/500000] + train/ActionL1Loss=0.1095 + throughput/total_tokens=171,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=896/500000] + train/ActionL1Loss=0.1169 + throughput/total_tokens=172,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=897/500000] + train/ActionL1Loss=0.1002 + throughput/total_tokens=172,224,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=898/500000] + train/ActionL1Loss=0.1000 + throughput/total_tokens=172,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=899/500000] + train/ActionL1Loss=0.1078 + throughput/total_tokens=172,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=900/500000] + optim/total_grad_norm=14.10 + train/ActionL1Loss=0.1157 + throughput/total_tokens=172,800,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=901/500000] + train/ActionL1Loss=0.0846 + throughput/total_tokens=172,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=902/500000] + train/ActionL1Loss=0.0936 + throughput/total_tokens=173,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=903/500000] + train/ActionL1Loss=0.1137 + throughput/total_tokens=173,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=904/500000] + train/ActionL1Loss=0.1226 + throughput/total_tokens=173,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=905/500000] + train/ActionL1Loss=0.0910 + throughput/total_tokens=173,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=906/500000] + train/ActionL1Loss=0.1047 + throughput/total_tokens=173,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=907/500000] + train/ActionL1Loss=0.0979 + throughput/total_tokens=174,144,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=908/500000] + train/ActionL1Loss=0.0834 + throughput/total_tokens=174,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=909/500000] + train/ActionL1Loss=0.0898 + throughput/total_tokens=174,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=910/500000] + train/ActionL1Loss=0.1114 + throughput/total_tokens=174,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=911/500000] + train/ActionL1Loss=0.1088 + throughput/total_tokens=174,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=912/500000] + train/ActionL1Loss=0.1013 + throughput/total_tokens=175,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=913/500000] + train/ActionL1Loss=0.0876 + throughput/total_tokens=175,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=914/500000] + train/ActionL1Loss=0.0947 + throughput/total_tokens=175,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=915/500000] + train/ActionL1Loss=0.1110 + throughput/total_tokens=175,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=916/500000] + train/ActionL1Loss=0.0968 + throughput/total_tokens=175,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=917/500000] + train/ActionL1Loss=0.0804 + throughput/total_tokens=176,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=918/500000] + train/ActionL1Loss=0.0927 + throughput/total_tokens=176,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=919/500000] + train/ActionL1Loss=0.0978 + throughput/total_tokens=176,448,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=920/500000] + optim/total_grad_norm=11.91 + train/ActionL1Loss=0.1019 + throughput/total_tokens=176,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=921/500000] + train/ActionL1Loss=0.1054 + throughput/total_tokens=176,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=922/500000] + train/ActionL1Loss=0.1246 + throughput/total_tokens=177,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=923/500000] + train/ActionL1Loss=0.1051 + throughput/total_tokens=177,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=924/500000] + train/ActionL1Loss=0.1093 + throughput/total_tokens=177,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=925/500000] + train/ActionL1Loss=0.1065 + throughput/total_tokens=177,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=926/500000] + train/ActionL1Loss=0.1019 + throughput/total_tokens=177,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=927/500000] + train/ActionL1Loss=0.0889 + throughput/total_tokens=177,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=928/500000] + train/ActionL1Loss=0.0929 + throughput/total_tokens=178,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=929/500000] + train/ActionL1Loss=0.0945 + throughput/total_tokens=178,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=930/500000] + train/ActionL1Loss=0.0990 + throughput/total_tokens=178,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=931/500000] + train/ActionL1Loss=0.0937 + throughput/total_tokens=178,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=932/500000] + train/ActionL1Loss=0.0902 + throughput/total_tokens=178,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=933/500000] + train/ActionL1Loss=0.0990 + throughput/total_tokens=179,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=934/500000] + train/ActionL1Loss=0.1008 + throughput/total_tokens=179,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=935/500000] + train/ActionL1Loss=0.1031 + throughput/total_tokens=179,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=936/500000] + train/ActionL1Loss=0.0996 + throughput/total_tokens=179,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=937/500000] + train/ActionL1Loss=0.0996 + throughput/total_tokens=179,904,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=938/500000] + train/ActionL1Loss=0.0781 + throughput/total_tokens=180,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=939/500000] + train/ActionL1Loss=0.0987 + throughput/total_tokens=180,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=940/500000] + optim/total_grad_norm=13.08 + train/ActionL1Loss=0.0983 + throughput/total_tokens=180,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=941/500000] + train/ActionL1Loss=0.0919 + throughput/total_tokens=180,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=942/500000] + train/ActionL1Loss=0.0911 + throughput/total_tokens=180,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=943/500000] + train/ActionL1Loss=0.0901 + throughput/total_tokens=181,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=944/500000] + train/ActionL1Loss=0.1130 + throughput/total_tokens=181,248,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=945/500000] + train/ActionL1Loss=0.1038 + throughput/total_tokens=181,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=946/500000] + train/ActionL1Loss=0.0966 + throughput/total_tokens=181,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=947/500000] + train/ActionL1Loss=0.0836 + throughput/total_tokens=181,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=948/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=182,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=949/500000] + train/ActionL1Loss=0.1054 + throughput/total_tokens=182,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=950/500000] + train/ActionL1Loss=0.0996 + throughput/total_tokens=182,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=951/500000] + train/ActionL1Loss=0.0919 + throughput/total_tokens=182,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=952/500000] + train/ActionL1Loss=0.1036 + throughput/total_tokens=182,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=953/500000] + train/ActionL1Loss=0.1039 + throughput/total_tokens=182,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=954/500000] + train/ActionL1Loss=0.1053 + throughput/total_tokens=183,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=955/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=183,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=956/500000] + train/ActionL1Loss=0.1147 + throughput/total_tokens=183,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=957/500000] + train/ActionL1Loss=0.1052 + throughput/total_tokens=183,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=958/500000] + train/ActionL1Loss=0.1015 + throughput/total_tokens=183,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=959/500000] + train/ActionL1Loss=0.1050 + throughput/total_tokens=184,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=960/500000] + optim/total_grad_norm=10.94 + train/ActionL1Loss=0.0955 + throughput/total_tokens=184,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=961/500000] + train/ActionL1Loss=0.0956 + throughput/total_tokens=184,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=962/500000] + train/ActionL1Loss=0.1010 + throughput/total_tokens=184,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=963/500000] + train/ActionL1Loss=0.1037 + throughput/total_tokens=184,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=964/500000] + train/ActionL1Loss=0.0959 + throughput/total_tokens=185,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=965/500000] + train/ActionL1Loss=0.1139 + throughput/total_tokens=185,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=966/500000] + train/ActionL1Loss=0.0962 + throughput/total_tokens=185,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=967/500000] + train/ActionL1Loss=0.1026 + throughput/total_tokens=185,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=968/500000] + train/ActionL1Loss=0.1177 + throughput/total_tokens=185,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=969/500000] + train/ActionL1Loss=0.0994 + throughput/total_tokens=186,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=970/500000] + train/ActionL1Loss=0.1001 + throughput/total_tokens=186,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=971/500000] + train/ActionL1Loss=0.0982 + throughput/total_tokens=186,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=972/500000] + train/ActionL1Loss=0.0953 + throughput/total_tokens=186,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=973/500000] + train/ActionL1Loss=0.1013 + throughput/total_tokens=186,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=974/500000] + train/ActionL1Loss=0.1128 + throughput/total_tokens=187,008,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=975/500000] + train/ActionL1Loss=0.1091 + throughput/total_tokens=187,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=976/500000] + train/ActionL1Loss=0.1024 + throughput/total_tokens=187,392,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=977/500000] + train/ActionL1Loss=0.0934 + throughput/total_tokens=187,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=978/500000] + train/ActionL1Loss=0.1048 + throughput/total_tokens=187,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=979/500000] + train/ActionL1Loss=0.0925 + throughput/total_tokens=187,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=980/500000] + optim/total_grad_norm=11.20 + train/ActionL1Loss=0.0916 + throughput/total_tokens=188,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=981/500000] + train/ActionL1Loss=0.1006 + throughput/total_tokens=188,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=982/500000] + train/ActionL1Loss=0.0938 + throughput/total_tokens=188,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=983/500000] + train/ActionL1Loss=0.0867 + throughput/total_tokens=188,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=984/500000] + train/ActionL1Loss=0.0807 + throughput/total_tokens=188,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=985/500000] + train/ActionL1Loss=0.0996 + throughput/total_tokens=189,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=986/500000] + train/ActionL1Loss=0.0909 + throughput/total_tokens=189,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=987/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=189,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=988/500000] + train/ActionL1Loss=0.1005 + throughput/total_tokens=189,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=989/500000] + train/ActionL1Loss=0.0909 + throughput/total_tokens=189,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=990/500000] + train/ActionL1Loss=0.0926 + throughput/total_tokens=190,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=991/500000] + train/ActionL1Loss=0.1016 + throughput/total_tokens=190,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=992/500000] + train/ActionL1Loss=0.1000 + throughput/total_tokens=190,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=993/500000] + train/ActionL1Loss=0.1123 + throughput/total_tokens=190,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=994/500000] + train/ActionL1Loss=0.0986 + throughput/total_tokens=190,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=995/500000] + train/ActionL1Loss=0.0930 + throughput/total_tokens=191,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=996/500000] + train/ActionL1Loss=0.1074 + throughput/total_tokens=191,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=997/500000] + train/ActionL1Loss=0.1023 + throughput/total_tokens=191,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=998/500000] + train/ActionL1Loss=0.0989 + throughput/total_tokens=191,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=999/500000] + train/ActionL1Loss=0.1050 + throughput/total_tokens=191,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1000/500000] + optim/total_grad_norm=12.36 + train/ActionL1Loss=0.0872 + throughput/total_tokens=192,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/11 [22:26:33] INFO | >> Saving config... checkpoint.py:608 +10/11 [22:27:04] INFO | >> Saving model state... checkpoint.py:796 +10/11 [22:28:17] INFO | >> Saving optim state... checkpoint.py:811 +10/11 [22:29:49] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=1001/500000] + train/ActionL1Loss=0.0914 + throughput/total_tokens=192,192,000 + throughput/device/tokens_per_second=1,208 + throughput/device/batches_per_second=0.0503 +[step=1002/500000] + train/ActionL1Loss=0.1081 + throughput/total_tokens=192,384,000 + throughput/device/tokens_per_second=1,187 + throughput/device/batches_per_second=0.0495 +[step=1003/500000] + train/ActionL1Loss=0.0889 + throughput/total_tokens=192,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1004/500000] + train/ActionL1Loss=0.0915 + throughput/total_tokens=192,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1005/500000] + train/ActionL1Loss=0.0946 + throughput/total_tokens=192,960,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1006/500000] + train/ActionL1Loss=0.0865 + throughput/total_tokens=193,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1007/500000] + train/ActionL1Loss=0.0866 + throughput/total_tokens=193,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1008/500000] + train/ActionL1Loss=0.1090 + throughput/total_tokens=193,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1009/500000] + train/ActionL1Loss=0.0935 + throughput/total_tokens=193,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1010/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=193,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1011/500000] + train/ActionL1Loss=0.0803 + throughput/total_tokens=194,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1012/500000] + train/ActionL1Loss=0.1044 + throughput/total_tokens=194,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1013/500000] + train/ActionL1Loss=0.0793 + throughput/total_tokens=194,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1014/500000] + train/ActionL1Loss=0.0933 + throughput/total_tokens=194,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1015/500000] + train/ActionL1Loss=0.1049 + throughput/total_tokens=194,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1016/500000] + train/ActionL1Loss=0.0837 + throughput/total_tokens=195,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1017/500000] + train/ActionL1Loss=0.0986 + throughput/total_tokens=195,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1018/500000] + train/ActionL1Loss=0.1143 + throughput/total_tokens=195,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1019/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=195,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1020/500000] + optim/total_grad_norm=13.41 + train/ActionL1Loss=0.1014 + throughput/total_tokens=195,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1021/500000] + train/ActionL1Loss=0.1208 + throughput/total_tokens=196,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1022/500000] + train/ActionL1Loss=0.0955 + throughput/total_tokens=196,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1023/500000] + train/ActionL1Loss=0.1035 + throughput/total_tokens=196,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1024/500000] + train/ActionL1Loss=0.0921 + throughput/total_tokens=196,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1025/500000] + train/ActionL1Loss=0.1056 + throughput/total_tokens=196,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1026/500000] + train/ActionL1Loss=0.0883 + throughput/total_tokens=196,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1027/500000] + train/ActionL1Loss=0.1073 + throughput/total_tokens=197,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1028/500000] + train/ActionL1Loss=0.0929 + throughput/total_tokens=197,376,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1029/500000] + train/ActionL1Loss=0.0810 + throughput/total_tokens=197,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1030/500000] + train/ActionL1Loss=0.0829 + throughput/total_tokens=197,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1031/500000] + train/ActionL1Loss=0.0835 + throughput/total_tokens=197,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1032/500000] + train/ActionL1Loss=0.1003 + throughput/total_tokens=198,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1033/500000] + train/ActionL1Loss=0.0949 + throughput/total_tokens=198,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1034/500000] + train/ActionL1Loss=0.0902 + throughput/total_tokens=198,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1035/500000] + train/ActionL1Loss=0.0946 + throughput/total_tokens=198,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1036/500000] + train/ActionL1Loss=0.0880 + throughput/total_tokens=198,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1037/500000] + train/ActionL1Loss=0.0890 + throughput/total_tokens=199,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1038/500000] + train/ActionL1Loss=0.0926 + throughput/total_tokens=199,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1039/500000] + train/ActionL1Loss=0.0907 + throughput/total_tokens=199,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1040/500000] + optim/total_grad_norm=13.36 + train/ActionL1Loss=0.0971 + throughput/total_tokens=199,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1041/500000] + train/ActionL1Loss=0.0926 + throughput/total_tokens=199,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1042/500000] + train/ActionL1Loss=0.1013 + throughput/total_tokens=200,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1043/500000] + train/ActionL1Loss=0.0984 + throughput/total_tokens=200,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1044/500000] + train/ActionL1Loss=0.1013 + throughput/total_tokens=200,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1045/500000] + train/ActionL1Loss=0.1003 + throughput/total_tokens=200,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1046/500000] + train/ActionL1Loss=0.1042 + throughput/total_tokens=200,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1047/500000] + train/ActionL1Loss=0.0960 + throughput/total_tokens=201,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1048/500000] + train/ActionL1Loss=0.0935 + throughput/total_tokens=201,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1049/500000] + train/ActionL1Loss=0.1007 + throughput/total_tokens=201,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1050/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=201,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1051/500000] + train/ActionL1Loss=0.0846 + throughput/total_tokens=201,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1052/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=201,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1053/500000] + train/ActionL1Loss=0.0924 + throughput/total_tokens=202,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1054/500000] + train/ActionL1Loss=0.0879 + throughput/total_tokens=202,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1055/500000] + train/ActionL1Loss=0.0992 + throughput/total_tokens=202,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1056/500000] + train/ActionL1Loss=0.0978 + throughput/total_tokens=202,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1057/500000] + train/ActionL1Loss=0.1031 + throughput/total_tokens=202,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1058/500000] + train/ActionL1Loss=0.0882 + throughput/total_tokens=203,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1059/500000] + train/ActionL1Loss=0.0863 + throughput/total_tokens=203,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1060/500000] + optim/total_grad_norm=13.73 + train/ActionL1Loss=0.0898 + throughput/total_tokens=203,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1061/500000] + train/ActionL1Loss=0.0943 + throughput/total_tokens=203,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1062/500000] + train/ActionL1Loss=0.0906 + throughput/total_tokens=203,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1063/500000] + train/ActionL1Loss=0.1000 + throughput/total_tokens=204,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1064/500000] + train/ActionL1Loss=0.0958 + throughput/total_tokens=204,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1065/500000] + train/ActionL1Loss=0.1167 + throughput/total_tokens=204,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1066/500000] + train/ActionL1Loss=0.0914 + throughput/total_tokens=204,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1067/500000] + train/ActionL1Loss=0.1102 + throughput/total_tokens=204,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1068/500000] + train/ActionL1Loss=0.1043 + throughput/total_tokens=205,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1069/500000] + train/ActionL1Loss=0.1057 + throughput/total_tokens=205,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1070/500000] + train/ActionL1Loss=0.0964 + throughput/total_tokens=205,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1071/500000] + train/ActionL1Loss=0.0914 + throughput/total_tokens=205,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1072/500000] + train/ActionL1Loss=0.0899 + throughput/total_tokens=205,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1073/500000] + train/ActionL1Loss=0.0916 + throughput/total_tokens=206,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1074/500000] + train/ActionL1Loss=0.1010 + throughput/total_tokens=206,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1075/500000] + train/ActionL1Loss=0.0939 + throughput/total_tokens=206,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1076/500000] + train/ActionL1Loss=0.0979 + throughput/total_tokens=206,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1077/500000] + train/ActionL1Loss=0.0817 + throughput/total_tokens=206,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1078/500000] + train/ActionL1Loss=0.1015 + throughput/total_tokens=206,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1079/500000] + train/ActionL1Loss=0.1016 + throughput/total_tokens=207,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1080/500000] + optim/total_grad_norm=10.78 + train/ActionL1Loss=0.1150 + throughput/total_tokens=207,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1081/500000] + train/ActionL1Loss=0.0860 + throughput/total_tokens=207,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1082/500000] + train/ActionL1Loss=0.0910 + throughput/total_tokens=207,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1083/500000] + train/ActionL1Loss=0.0967 + throughput/total_tokens=207,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1084/500000] + train/ActionL1Loss=0.0887 + throughput/total_tokens=208,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1085/500000] + train/ActionL1Loss=0.0836 + throughput/total_tokens=208,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1086/500000] + train/ActionL1Loss=0.0804 + throughput/total_tokens=208,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1087/500000] + train/ActionL1Loss=0.1091 + throughput/total_tokens=208,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1088/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=208,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1089/500000] + train/ActionL1Loss=0.0739 + throughput/total_tokens=209,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1090/500000] + train/ActionL1Loss=0.1044 + throughput/total_tokens=209,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1091/500000] + train/ActionL1Loss=0.0979 + throughput/total_tokens=209,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1092/500000] + train/ActionL1Loss=0.0912 + throughput/total_tokens=209,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1093/500000] + train/ActionL1Loss=0.0954 + throughput/total_tokens=209,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1094/500000] + train/ActionL1Loss=0.0746 + throughput/total_tokens=210,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1095/500000] + train/ActionL1Loss=0.1011 + throughput/total_tokens=210,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1096/500000] + train/ActionL1Loss=0.0955 + throughput/total_tokens=210,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1097/500000] + train/ActionL1Loss=0.0996 + throughput/total_tokens=210,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1098/500000] + train/ActionL1Loss=0.0917 + throughput/total_tokens=210,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1099/500000] + train/ActionL1Loss=0.0903 + throughput/total_tokens=211,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1100/500000] + optim/total_grad_norm=13.16 + train/ActionL1Loss=0.0839 + throughput/total_tokens=211,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1101/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=211,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1102/500000] + train/ActionL1Loss=0.0952 + throughput/total_tokens=211,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1103/500000] + train/ActionL1Loss=0.0938 + throughput/total_tokens=211,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1104/500000] + train/ActionL1Loss=0.0938 + throughput/total_tokens=211,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1105/500000] + train/ActionL1Loss=0.0865 + throughput/total_tokens=212,160,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=1106/500000] + train/ActionL1Loss=0.0907 + throughput/total_tokens=212,352,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1107/500000] + train/ActionL1Loss=0.1024 + throughput/total_tokens=212,544,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1108/500000] + train/ActionL1Loss=0.0960 + throughput/total_tokens=212,736,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1109/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=212,928,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1110/500000] + train/ActionL1Loss=0.0843 + throughput/total_tokens=213,120,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=1111/500000] + train/ActionL1Loss=0.0994 + throughput/total_tokens=213,312,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1112/500000] + train/ActionL1Loss=0.0887 + throughput/total_tokens=213,504,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1113/500000] + train/ActionL1Loss=0.0895 + throughput/total_tokens=213,696,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1114/500000] + train/ActionL1Loss=0.0918 + throughput/total_tokens=213,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1115/500000] + train/ActionL1Loss=0.0859 + throughput/total_tokens=214,080,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1116/500000] + train/ActionL1Loss=0.1030 + throughput/total_tokens=214,272,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1117/500000] + train/ActionL1Loss=0.1142 + throughput/total_tokens=214,464,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1118/500000] + train/ActionL1Loss=0.0860 + throughput/total_tokens=214,656,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=1119/500000] + train/ActionL1Loss=0.0763 + throughput/total_tokens=214,848,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=1120/500000] + optim/total_grad_norm=11.46 + train/ActionL1Loss=0.0903 + throughput/total_tokens=215,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1121/500000] + train/ActionL1Loss=0.0854 + throughput/total_tokens=215,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1122/500000] + train/ActionL1Loss=0.0964 + throughput/total_tokens=215,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1123/500000] + train/ActionL1Loss=0.0823 + throughput/total_tokens=215,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1124/500000] + train/ActionL1Loss=0.0874 + throughput/total_tokens=215,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1125/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=216,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1126/500000] + train/ActionL1Loss=0.0888 + throughput/total_tokens=216,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1127/500000] + train/ActionL1Loss=0.0820 + throughput/total_tokens=216,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1128/500000] + train/ActionL1Loss=0.0963 + throughput/total_tokens=216,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1129/500000] + train/ActionL1Loss=0.0903 + throughput/total_tokens=216,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1130/500000] + train/ActionL1Loss=0.0954 + throughput/total_tokens=216,960,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1131/500000] + train/ActionL1Loss=0.0985 + throughput/total_tokens=217,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1132/500000] + train/ActionL1Loss=0.0955 + throughput/total_tokens=217,344,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1133/500000] + train/ActionL1Loss=0.0810 + throughput/total_tokens=217,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1134/500000] + train/ActionL1Loss=0.0944 + throughput/total_tokens=217,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1135/500000] + train/ActionL1Loss=0.0918 + throughput/total_tokens=217,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1136/500000] + train/ActionL1Loss=0.0806 + throughput/total_tokens=218,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1137/500000] + train/ActionL1Loss=0.0914 + throughput/total_tokens=218,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1138/500000] + train/ActionL1Loss=0.0880 + throughput/total_tokens=218,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1139/500000] + train/ActionL1Loss=0.0964 + throughput/total_tokens=218,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1140/500000] + optim/total_grad_norm=12.67 + train/ActionL1Loss=0.0888 + throughput/total_tokens=218,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1141/500000] + train/ActionL1Loss=0.0903 + throughput/total_tokens=219,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1142/500000] + train/ActionL1Loss=0.1045 + throughput/total_tokens=219,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1143/500000] + train/ActionL1Loss=0.1152 + throughput/total_tokens=219,456,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1144/500000] + train/ActionL1Loss=0.1029 + throughput/total_tokens=219,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1145/500000] + train/ActionL1Loss=0.0925 + throughput/total_tokens=219,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1146/500000] + train/ActionL1Loss=0.0935 + throughput/total_tokens=220,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1147/500000] + train/ActionL1Loss=0.1088 + throughput/total_tokens=220,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1148/500000] + train/ActionL1Loss=0.0981 + throughput/total_tokens=220,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1149/500000] + train/ActionL1Loss=0.0868 + throughput/total_tokens=220,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1150/500000] + train/ActionL1Loss=0.0913 + throughput/total_tokens=220,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1151/500000] + train/ActionL1Loss=0.1048 + throughput/total_tokens=220,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1152/500000] + train/ActionL1Loss=0.0947 + throughput/total_tokens=221,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1153/500000] + train/ActionL1Loss=0.0920 + throughput/total_tokens=221,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1154/500000] + train/ActionL1Loss=0.0995 + throughput/total_tokens=221,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1155/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=221,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1156/500000] + train/ActionL1Loss=0.1230 + throughput/total_tokens=221,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1157/500000] + train/ActionL1Loss=0.1045 + throughput/total_tokens=222,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1158/500000] + train/ActionL1Loss=0.0919 + throughput/total_tokens=222,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1159/500000] + train/ActionL1Loss=0.0941 + throughput/total_tokens=222,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1160/500000] + optim/total_grad_norm=13.06 + train/ActionL1Loss=0.0842 + throughput/total_tokens=222,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1161/500000] + train/ActionL1Loss=0.0775 + throughput/total_tokens=222,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1162/500000] + train/ActionL1Loss=0.0901 + throughput/total_tokens=223,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1163/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=223,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1164/500000] + train/ActionL1Loss=0.0890 + throughput/total_tokens=223,488,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1165/500000] + train/ActionL1Loss=0.0889 + throughput/total_tokens=223,680,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1166/500000] + train/ActionL1Loss=0.1052 + throughput/total_tokens=223,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1167/500000] + train/ActionL1Loss=0.1080 + throughput/total_tokens=224,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1168/500000] + train/ActionL1Loss=0.1007 + throughput/total_tokens=224,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1169/500000] + train/ActionL1Loss=0.0748 + throughput/total_tokens=224,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1170/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=224,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1171/500000] + train/ActionL1Loss=0.0988 + throughput/total_tokens=224,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1172/500000] + train/ActionL1Loss=0.0858 + throughput/total_tokens=225,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1173/500000] + train/ActionL1Loss=0.1018 + throughput/total_tokens=225,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1174/500000] + train/ActionL1Loss=0.0967 + throughput/total_tokens=225,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1175/500000] + train/ActionL1Loss=0.0972 + throughput/total_tokens=225,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1176/500000] + train/ActionL1Loss=0.1141 + throughput/total_tokens=225,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1177/500000] + train/ActionL1Loss=0.1009 + throughput/total_tokens=225,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1178/500000] + train/ActionL1Loss=0.0913 + throughput/total_tokens=226,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1179/500000] + train/ActionL1Loss=0.1066 + throughput/total_tokens=226,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1180/500000] + optim/total_grad_norm=12.35 + train/ActionL1Loss=0.0994 + throughput/total_tokens=226,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1181/500000] + train/ActionL1Loss=0.1055 + throughput/total_tokens=226,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1182/500000] + train/ActionL1Loss=0.0997 + throughput/total_tokens=226,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1183/500000] + train/ActionL1Loss=0.0892 + throughput/total_tokens=227,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1184/500000] + train/ActionL1Loss=0.0988 + throughput/total_tokens=227,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1185/500000] + train/ActionL1Loss=0.1116 + throughput/total_tokens=227,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1186/500000] + train/ActionL1Loss=0.1139 + throughput/total_tokens=227,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1187/500000] + train/ActionL1Loss=0.0825 + throughput/total_tokens=227,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1188/500000] + train/ActionL1Loss=0.1088 + throughput/total_tokens=228,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1189/500000] + train/ActionL1Loss=0.1031 + throughput/total_tokens=228,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1190/500000] + train/ActionL1Loss=0.0933 + throughput/total_tokens=228,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1191/500000] + train/ActionL1Loss=0.0960 + throughput/total_tokens=228,672,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1192/500000] + train/ActionL1Loss=0.1032 + throughput/total_tokens=228,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1193/500000] + train/ActionL1Loss=0.1104 + throughput/total_tokens=229,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1194/500000] + train/ActionL1Loss=0.1069 + throughput/total_tokens=229,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1195/500000] + train/ActionL1Loss=0.1000 + throughput/total_tokens=229,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1196/500000] + train/ActionL1Loss=0.1066 + throughput/total_tokens=229,632,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1197/500000] + train/ActionL1Loss=0.1115 + throughput/total_tokens=229,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1198/500000] + train/ActionL1Loss=0.1031 + throughput/total_tokens=230,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1199/500000] + train/ActionL1Loss=0.1037 + throughput/total_tokens=230,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1200/500000] + optim/total_grad_norm=11.16 + train/ActionL1Loss=0.1022 + throughput/total_tokens=230,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1201/500000] + train/ActionL1Loss=0.1072 + throughput/total_tokens=230,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1202/500000] + train/ActionL1Loss=0.0839 + throughput/total_tokens=230,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1203/500000] + train/ActionL1Loss=0.0909 + throughput/total_tokens=230,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1204/500000] + train/ActionL1Loss=0.1033 + throughput/total_tokens=231,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1205/500000] + train/ActionL1Loss=0.0802 + throughput/total_tokens=231,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1206/500000] + train/ActionL1Loss=0.1034 + throughput/total_tokens=231,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1207/500000] + train/ActionL1Loss=0.0993 + throughput/total_tokens=231,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1208/500000] + train/ActionL1Loss=0.0946 + throughput/total_tokens=231,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=1209/500000] + train/ActionL1Loss=0.0842 + throughput/total_tokens=232,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=1210/500000] + train/ActionL1Loss=0.0877 + throughput/total_tokens=232,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=1211/500000] + train/ActionL1Loss=0.0974 + throughput/total_tokens=232,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1212/500000] + train/ActionL1Loss=0.0978 + throughput/total_tokens=232,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1213/500000] + train/ActionL1Loss=0.1021 + throughput/total_tokens=232,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1214/500000] + train/ActionL1Loss=0.0956 + throughput/total_tokens=233,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1215/500000] + train/ActionL1Loss=0.0963 + throughput/total_tokens=233,280,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1216/500000] + train/ActionL1Loss=0.1040 + throughput/total_tokens=233,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1217/500000] + train/ActionL1Loss=0.1060 + throughput/total_tokens=233,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1218/500000] + train/ActionL1Loss=0.1058 + throughput/total_tokens=233,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1219/500000] + train/ActionL1Loss=0.1019 + throughput/total_tokens=234,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1220/500000] + optim/total_grad_norm=12.13 + train/ActionL1Loss=0.1064 + throughput/total_tokens=234,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1221/500000] + train/ActionL1Loss=0.0948 + throughput/total_tokens=234,432,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1222/500000] + train/ActionL1Loss=0.1084 + throughput/total_tokens=234,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1223/500000] + train/ActionL1Loss=0.0906 + throughput/total_tokens=234,816,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1224/500000] + train/ActionL1Loss=0.0976 + throughput/total_tokens=235,008,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1225/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=235,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1226/500000] + train/ActionL1Loss=0.0787 + throughput/total_tokens=235,392,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1227/500000] + train/ActionL1Loss=0.0886 + throughput/total_tokens=235,584,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1228/500000] + train/ActionL1Loss=0.0863 + throughput/total_tokens=235,776,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1229/500000] + train/ActionL1Loss=0.0743 + throughput/total_tokens=235,968,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1230/500000] + train/ActionL1Loss=0.0730 + throughput/total_tokens=236,160,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1231/500000] + train/ActionL1Loss=0.0850 + throughput/total_tokens=236,352,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1232/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=236,544,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1233/500000] + train/ActionL1Loss=0.0902 + throughput/total_tokens=236,736,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1234/500000] + train/ActionL1Loss=0.0810 + throughput/total_tokens=236,928,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1235/500000] + train/ActionL1Loss=0.0847 + throughput/total_tokens=237,120,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1236/500000] + train/ActionL1Loss=0.1025 + throughput/total_tokens=237,312,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1237/500000] + train/ActionL1Loss=0.0899 + throughput/total_tokens=237,504,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1238/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=237,696,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1239/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=237,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1240/500000] + optim/total_grad_norm=11.98 + train/ActionL1Loss=0.0934 + throughput/total_tokens=238,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1241/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=238,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1242/500000] + train/ActionL1Loss=0.0877 + throughput/total_tokens=238,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1243/500000] + train/ActionL1Loss=0.0857 + throughput/total_tokens=238,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1244/500000] + train/ActionL1Loss=0.0944 + throughput/total_tokens=238,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1245/500000] + train/ActionL1Loss=0.0801 + throughput/total_tokens=239,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1246/500000] + train/ActionL1Loss=0.0764 + throughput/total_tokens=239,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1247/500000] + train/ActionL1Loss=0.0827 + throughput/total_tokens=239,424,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1248/500000] + train/ActionL1Loss=0.0856 + throughput/total_tokens=239,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1249/500000] + train/ActionL1Loss=0.1028 + throughput/total_tokens=239,808,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1250/500000] + train/ActionL1Loss=0.0904 + throughput/total_tokens=240,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1251/500000] + train/ActionL1Loss=0.1003 + throughput/total_tokens=240,192,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1252/500000] + train/ActionL1Loss=0.0861 + throughput/total_tokens=240,384,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1253/500000] + train/ActionL1Loss=0.0878 + throughput/total_tokens=240,576,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1254/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=240,768,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1255/500000] + train/ActionL1Loss=0.0882 + throughput/total_tokens=240,960,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1256/500000] + train/ActionL1Loss=0.0866 + throughput/total_tokens=241,152,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1257/500000] + train/ActionL1Loss=0.0880 + throughput/total_tokens=241,344,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1258/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=241,536,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1259/500000] + train/ActionL1Loss=0.0994 + throughput/total_tokens=241,728,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1260/500000] + optim/total_grad_norm=12.51 + train/ActionL1Loss=0.0746 + throughput/total_tokens=241,920,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=1261/500000] + train/ActionL1Loss=0.0855 + throughput/total_tokens=242,112,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1262/500000] + train/ActionL1Loss=0.0967 + throughput/total_tokens=242,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1263/500000] + train/ActionL1Loss=0.0913 + throughput/total_tokens=242,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1264/500000] + train/ActionL1Loss=0.0937 + throughput/total_tokens=242,688,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1265/500000] + train/ActionL1Loss=0.1016 + throughput/total_tokens=242,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1266/500000] + train/ActionL1Loss=0.0907 + throughput/total_tokens=243,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1267/500000] + train/ActionL1Loss=0.0829 + throughput/total_tokens=243,264,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1268/500000] + train/ActionL1Loss=0.1029 + throughput/total_tokens=243,456,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1269/500000] + train/ActionL1Loss=0.0909 + throughput/total_tokens=243,648,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1270/500000] + train/ActionL1Loss=0.1067 + throughput/total_tokens=243,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1271/500000] + train/ActionL1Loss=0.0945 + throughput/total_tokens=244,032,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1272/500000] + train/ActionL1Loss=0.1007 + throughput/total_tokens=244,224,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1273/500000] + train/ActionL1Loss=0.0868 + throughput/total_tokens=244,416,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1274/500000] + train/ActionL1Loss=0.1085 + throughput/total_tokens=244,608,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1275/500000] + train/ActionL1Loss=0.1130 + throughput/total_tokens=244,800,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1276/500000] + train/ActionL1Loss=0.1104 + throughput/total_tokens=244,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1277/500000] + train/ActionL1Loss=0.0943 + throughput/total_tokens=245,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1278/500000] + train/ActionL1Loss=0.0927 + throughput/total_tokens=245,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1279/500000] + train/ActionL1Loss=0.1079 + throughput/total_tokens=245,568,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1280/500000] + optim/total_grad_norm=12.36 + train/ActionL1Loss=0.1045 + throughput/total_tokens=245,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1281/500000] + train/ActionL1Loss=0.0873 + throughput/total_tokens=245,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1282/500000] + train/ActionL1Loss=0.0945 + throughput/total_tokens=246,144,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1283/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=246,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1284/500000] + train/ActionL1Loss=0.0815 + throughput/total_tokens=246,528,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1285/500000] + train/ActionL1Loss=0.0850 + throughput/total_tokens=246,720,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1286/500000] + train/ActionL1Loss=0.0792 + throughput/total_tokens=246,912,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1287/500000] + train/ActionL1Loss=0.0825 + throughput/total_tokens=247,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1288/500000] + train/ActionL1Loss=0.0916 + throughput/total_tokens=247,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1289/500000] + train/ActionL1Loss=0.0847 + throughput/total_tokens=247,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1290/500000] + train/ActionL1Loss=0.0881 + throughput/total_tokens=247,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1291/500000] + train/ActionL1Loss=0.0805 + throughput/total_tokens=247,872,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1292/500000] + train/ActionL1Loss=0.0853 + throughput/total_tokens=248,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1293/500000] + train/ActionL1Loss=0.0816 + throughput/total_tokens=248,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1294/500000] + train/ActionL1Loss=0.0774 + throughput/total_tokens=248,448,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1295/500000] + train/ActionL1Loss=0.0964 + throughput/total_tokens=248,640,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1296/500000] + train/ActionL1Loss=0.1024 + throughput/total_tokens=248,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1297/500000] + train/ActionL1Loss=0.0835 + throughput/total_tokens=249,024,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1298/500000] + train/ActionL1Loss=0.0852 + throughput/total_tokens=249,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1299/500000] + train/ActionL1Loss=0.0935 + throughput/total_tokens=249,408,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1300/500000] + optim/total_grad_norm=10.15 + train/ActionL1Loss=0.0861 + throughput/total_tokens=249,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1301/500000] + train/ActionL1Loss=0.0828 + throughput/total_tokens=249,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1302/500000] + train/ActionL1Loss=0.0983 + throughput/total_tokens=249,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1303/500000] + train/ActionL1Loss=0.0856 + throughput/total_tokens=250,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1304/500000] + train/ActionL1Loss=0.0838 + throughput/total_tokens=250,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1305/500000] + train/ActionL1Loss=0.0979 + throughput/total_tokens=250,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1306/500000] + train/ActionL1Loss=0.0839 + throughput/total_tokens=250,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1307/500000] + train/ActionL1Loss=0.0857 + throughput/total_tokens=250,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1308/500000] + train/ActionL1Loss=0.0836 + throughput/total_tokens=251,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1309/500000] + train/ActionL1Loss=0.0827 + throughput/total_tokens=251,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1310/500000] + train/ActionL1Loss=0.0960 + throughput/total_tokens=251,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1311/500000] + train/ActionL1Loss=0.1020 + throughput/total_tokens=251,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1312/500000] + train/ActionL1Loss=0.1029 + throughput/total_tokens=251,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1313/500000] + train/ActionL1Loss=0.0844 + throughput/total_tokens=252,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1314/500000] + train/ActionL1Loss=0.1017 + throughput/total_tokens=252,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1315/500000] + train/ActionL1Loss=0.0911 + throughput/total_tokens=252,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1316/500000] + train/ActionL1Loss=0.0973 + throughput/total_tokens=252,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1317/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=252,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1318/500000] + train/ActionL1Loss=0.0902 + throughput/total_tokens=253,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1319/500000] + train/ActionL1Loss=0.0995 + throughput/total_tokens=253,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1320/500000] + optim/total_grad_norm=12.73 + train/ActionL1Loss=0.1019 + throughput/total_tokens=253,440,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1321/500000] + train/ActionL1Loss=0.0982 + throughput/total_tokens=253,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1322/500000] + train/ActionL1Loss=0.0904 + throughput/total_tokens=253,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1323/500000] + train/ActionL1Loss=0.0930 + throughput/total_tokens=254,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1324/500000] + train/ActionL1Loss=0.0979 + throughput/total_tokens=254,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1325/500000] + train/ActionL1Loss=0.0806 + throughput/total_tokens=254,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1326/500000] + train/ActionL1Loss=0.0864 + throughput/total_tokens=254,592,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1327/500000] + train/ActionL1Loss=0.0846 + throughput/total_tokens=254,784,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1328/500000] + train/ActionL1Loss=0.0891 + throughput/total_tokens=254,976,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1329/500000] + train/ActionL1Loss=0.0859 + throughput/total_tokens=255,168,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1330/500000] + train/ActionL1Loss=0.0933 + throughput/total_tokens=255,360,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1331/500000] + train/ActionL1Loss=0.0900 + throughput/total_tokens=255,552,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1332/500000] + train/ActionL1Loss=0.0812 + throughput/total_tokens=255,744,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1333/500000] + train/ActionL1Loss=0.0992 + throughput/total_tokens=255,936,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1334/500000] + train/ActionL1Loss=0.0876 + throughput/total_tokens=256,128,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1335/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=256,320,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1336/500000] + train/ActionL1Loss=0.0844 + throughput/total_tokens=256,512,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1337/500000] + train/ActionL1Loss=0.0776 + throughput/total_tokens=256,704,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1338/500000] + train/ActionL1Loss=0.0950 + throughput/total_tokens=256,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1339/500000] + train/ActionL1Loss=0.1061 + throughput/total_tokens=257,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1340/500000] + optim/total_grad_norm=11.58 + train/ActionL1Loss=0.1113 + throughput/total_tokens=257,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1341/500000] + train/ActionL1Loss=0.0832 + throughput/total_tokens=257,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1342/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=257,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1343/500000] + train/ActionL1Loss=0.0769 + throughput/total_tokens=257,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1344/500000] + train/ActionL1Loss=0.0707 + throughput/total_tokens=258,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1345/500000] + train/ActionL1Loss=0.0702 + throughput/total_tokens=258,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1346/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=258,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1347/500000] + train/ActionL1Loss=0.0885 + throughput/total_tokens=258,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1348/500000] + train/ActionL1Loss=0.0969 + throughput/total_tokens=258,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1349/500000] + train/ActionL1Loss=0.0866 + throughput/total_tokens=259,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1350/500000] + train/ActionL1Loss=0.0908 + throughput/total_tokens=259,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1351/500000] + train/ActionL1Loss=0.0758 + throughput/total_tokens=259,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1352/500000] + train/ActionL1Loss=0.0801 + throughput/total_tokens=259,584,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1353/500000] + train/ActionL1Loss=0.0882 + throughput/total_tokens=259,776,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1354/500000] + train/ActionL1Loss=0.0876 + throughput/total_tokens=259,968,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=1355/500000] + train/ActionL1Loss=0.1025 + throughput/total_tokens=260,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1356/500000] + train/ActionL1Loss=0.0944 + throughput/total_tokens=260,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1357/500000] + train/ActionL1Loss=0.0997 + throughput/total_tokens=260,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1358/500000] + train/ActionL1Loss=0.0969 + throughput/total_tokens=260,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1359/500000] + train/ActionL1Loss=0.0940 + throughput/total_tokens=260,928,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1360/500000] + optim/total_grad_norm=10.83 + train/ActionL1Loss=0.0956 + throughput/total_tokens=261,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1361/500000] + train/ActionL1Loss=0.0734 + throughput/total_tokens=261,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1362/500000] + train/ActionL1Loss=0.0981 + throughput/total_tokens=261,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1363/500000] + train/ActionL1Loss=0.0874 + throughput/total_tokens=261,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1364/500000] + train/ActionL1Loss=0.0903 + throughput/total_tokens=261,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1365/500000] + train/ActionL1Loss=0.0771 + throughput/total_tokens=262,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1366/500000] + train/ActionL1Loss=0.0846 + throughput/total_tokens=262,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1367/500000] + train/ActionL1Loss=0.0961 + throughput/total_tokens=262,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1368/500000] + train/ActionL1Loss=0.0828 + throughput/total_tokens=262,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1369/500000] + train/ActionL1Loss=0.0728 + throughput/total_tokens=262,848,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1370/500000] + train/ActionL1Loss=0.0884 + throughput/total_tokens=263,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1371/500000] + train/ActionL1Loss=0.1028 + throughput/total_tokens=263,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1372/500000] + train/ActionL1Loss=0.0857 + throughput/total_tokens=263,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1373/500000] + train/ActionL1Loss=0.0798 + throughput/total_tokens=263,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1374/500000] + train/ActionL1Loss=0.0762 + throughput/total_tokens=263,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1375/500000] + train/ActionL1Loss=0.0966 + throughput/total_tokens=264,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1376/500000] + train/ActionL1Loss=0.0858 + throughput/total_tokens=264,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1377/500000] + train/ActionL1Loss=0.1004 + throughput/total_tokens=264,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1378/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=264,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1379/500000] + train/ActionL1Loss=0.1059 + throughput/total_tokens=264,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1380/500000] + optim/total_grad_norm=11.35 + train/ActionL1Loss=0.0893 + throughput/total_tokens=264,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1381/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=265,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1382/500000] + train/ActionL1Loss=0.0899 + throughput/total_tokens=265,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1383/500000] + train/ActionL1Loss=0.0955 + throughput/total_tokens=265,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1384/500000] + train/ActionL1Loss=0.0966 + throughput/total_tokens=265,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1385/500000] + train/ActionL1Loss=0.0727 + throughput/total_tokens=265,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1386/500000] + train/ActionL1Loss=0.0848 + throughput/total_tokens=266,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1387/500000] + train/ActionL1Loss=0.0820 + throughput/total_tokens=266,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1388/500000] + train/ActionL1Loss=0.1004 + throughput/total_tokens=266,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1389/500000] + train/ActionL1Loss=0.0892 + throughput/total_tokens=266,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1390/500000] + train/ActionL1Loss=0.0731 + throughput/total_tokens=266,880,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1391/500000] + train/ActionL1Loss=0.0778 + throughput/total_tokens=267,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1392/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=267,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1393/500000] + train/ActionL1Loss=0.1228 + throughput/total_tokens=267,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1394/500000] + train/ActionL1Loss=0.0896 + throughput/total_tokens=267,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1395/500000] + train/ActionL1Loss=0.1038 + throughput/total_tokens=267,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1396/500000] + train/ActionL1Loss=0.0961 + throughput/total_tokens=268,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1397/500000] + train/ActionL1Loss=0.0932 + throughput/total_tokens=268,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1398/500000] + train/ActionL1Loss=0.0868 + throughput/total_tokens=268,416,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1399/500000] + train/ActionL1Loss=0.0904 + throughput/total_tokens=268,608,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1400/500000] + optim/total_grad_norm=12.73 + train/ActionL1Loss=0.1015 + throughput/total_tokens=268,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1401/500000] + train/ActionL1Loss=0.0914 + throughput/total_tokens=268,992,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1402/500000] + train/ActionL1Loss=0.0938 + throughput/total_tokens=269,184,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1403/500000] + train/ActionL1Loss=0.1055 + throughput/total_tokens=269,376,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1404/500000] + train/ActionL1Loss=0.0969 + throughput/total_tokens=269,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1405/500000] + train/ActionL1Loss=0.0867 + throughput/total_tokens=269,760,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1406/500000] + train/ActionL1Loss=0.0959 + throughput/total_tokens=269,952,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1407/500000] + train/ActionL1Loss=0.1048 + throughput/total_tokens=270,144,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=1408/500000] + train/ActionL1Loss=0.0997 + throughput/total_tokens=270,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1409/500000] + train/ActionL1Loss=0.0917 + throughput/total_tokens=270,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1410/500000] + train/ActionL1Loss=0.0971 + throughput/total_tokens=270,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1411/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=270,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1412/500000] + train/ActionL1Loss=0.0859 + throughput/total_tokens=271,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1413/500000] + train/ActionL1Loss=0.0820 + throughput/total_tokens=271,296,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1414/500000] + train/ActionL1Loss=0.0834 + throughput/total_tokens=271,488,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1415/500000] + train/ActionL1Loss=0.0843 + throughput/total_tokens=271,680,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1416/500000] + train/ActionL1Loss=0.0934 + throughput/total_tokens=271,872,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1417/500000] + train/ActionL1Loss=0.1004 + throughput/total_tokens=272,064,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1418/500000] + train/ActionL1Loss=0.0818 + throughput/total_tokens=272,256,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=1419/500000] + train/ActionL1Loss=0.0848 + throughput/total_tokens=272,448,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=1420/500000] + optim/total_grad_norm=10.04 + train/ActionL1Loss=0.0839 + throughput/total_tokens=272,640,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1421/500000] + train/ActionL1Loss=0.0904 + throughput/total_tokens=272,832,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1422/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=273,024,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1423/500000] + train/ActionL1Loss=0.0794 + throughput/total_tokens=273,216,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1424/500000] + train/ActionL1Loss=0.0941 + throughput/total_tokens=273,408,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1425/500000] + train/ActionL1Loss=0.0809 + throughput/total_tokens=273,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1426/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=273,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1427/500000] + train/ActionL1Loss=0.0830 + throughput/total_tokens=273,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1428/500000] + train/ActionL1Loss=0.0844 + throughput/total_tokens=274,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1429/500000] + train/ActionL1Loss=0.0808 + throughput/total_tokens=274,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1430/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=274,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1431/500000] + train/ActionL1Loss=0.0817 + throughput/total_tokens=274,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1432/500000] + train/ActionL1Loss=0.0938 + throughput/total_tokens=274,944,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1433/500000] + train/ActionL1Loss=0.0944 + throughput/total_tokens=275,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1434/500000] + train/ActionL1Loss=0.0826 + throughput/total_tokens=275,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1435/500000] + train/ActionL1Loss=0.0926 + throughput/total_tokens=275,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1436/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=275,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1437/500000] + train/ActionL1Loss=0.0841 + throughput/total_tokens=275,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1438/500000] + train/ActionL1Loss=0.0881 + throughput/total_tokens=276,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1439/500000] + train/ActionL1Loss=0.0873 + throughput/total_tokens=276,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1440/500000] + optim/total_grad_norm=10.64 + train/ActionL1Loss=0.0839 + throughput/total_tokens=276,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1441/500000] + train/ActionL1Loss=0.0996 + throughput/total_tokens=276,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1442/500000] + train/ActionL1Loss=0.0780 + throughput/total_tokens=276,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1443/500000] + train/ActionL1Loss=0.0974 + throughput/total_tokens=277,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1444/500000] + train/ActionL1Loss=0.0876 + throughput/total_tokens=277,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1445/500000] + train/ActionL1Loss=0.0938 + throughput/total_tokens=277,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1446/500000] + train/ActionL1Loss=0.0936 + throughput/total_tokens=277,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1447/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=277,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1448/500000] + train/ActionL1Loss=0.0904 + throughput/total_tokens=278,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1449/500000] + train/ActionL1Loss=0.0858 + throughput/total_tokens=278,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1450/500000] + train/ActionL1Loss=0.0919 + throughput/total_tokens=278,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1451/500000] + train/ActionL1Loss=0.1064 + throughput/total_tokens=278,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1452/500000] + train/ActionL1Loss=0.1036 + throughput/total_tokens=278,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1453/500000] + train/ActionL1Loss=0.0833 + throughput/total_tokens=278,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1454/500000] + train/ActionL1Loss=0.1013 + throughput/total_tokens=279,168,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1455/500000] + train/ActionL1Loss=0.0885 + throughput/total_tokens=279,360,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1456/500000] + train/ActionL1Loss=0.0882 + throughput/total_tokens=279,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1457/500000] + train/ActionL1Loss=0.0947 + throughput/total_tokens=279,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1458/500000] + train/ActionL1Loss=0.0848 + throughput/total_tokens=279,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1459/500000] + train/ActionL1Loss=0.0841 + throughput/total_tokens=280,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1460/500000] + optim/total_grad_norm=10.16 + train/ActionL1Loss=0.0851 + throughput/total_tokens=280,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1461/500000] + train/ActionL1Loss=0.0837 + throughput/total_tokens=280,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1462/500000] + train/ActionL1Loss=0.0876 + throughput/total_tokens=280,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1463/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=280,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1464/500000] + train/ActionL1Loss=0.0827 + throughput/total_tokens=281,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1465/500000] + train/ActionL1Loss=0.0910 + throughput/total_tokens=281,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1466/500000] + train/ActionL1Loss=0.1027 + throughput/total_tokens=281,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1467/500000] + train/ActionL1Loss=0.1076 + throughput/total_tokens=281,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1468/500000] + train/ActionL1Loss=0.0772 + throughput/total_tokens=281,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1469/500000] + train/ActionL1Loss=0.0864 + throughput/total_tokens=282,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1470/500000] + train/ActionL1Loss=0.0926 + throughput/total_tokens=282,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1471/500000] + train/ActionL1Loss=0.0887 + throughput/total_tokens=282,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1472/500000] + train/ActionL1Loss=0.0862 + throughput/total_tokens=282,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1473/500000] + train/ActionL1Loss=0.0917 + throughput/total_tokens=282,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1474/500000] + train/ActionL1Loss=0.0748 + throughput/total_tokens=283,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1475/500000] + train/ActionL1Loss=0.0919 + throughput/total_tokens=283,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1476/500000] + train/ActionL1Loss=0.0927 + throughput/total_tokens=283,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1477/500000] + train/ActionL1Loss=0.0890 + throughput/total_tokens=283,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1478/500000] + train/ActionL1Loss=0.0837 + throughput/total_tokens=283,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1479/500000] + train/ActionL1Loss=0.0969 + throughput/total_tokens=283,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1480/500000] + optim/total_grad_norm=9.878 + train/ActionL1Loss=0.0785 + throughput/total_tokens=284,160,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1481/500000] + train/ActionL1Loss=0.0937 + throughput/total_tokens=284,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1482/500000] + train/ActionL1Loss=0.0796 + throughput/total_tokens=284,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1483/500000] + train/ActionL1Loss=0.0755 + throughput/total_tokens=284,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1484/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=284,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1485/500000] + train/ActionL1Loss=0.0882 + throughput/total_tokens=285,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1486/500000] + train/ActionL1Loss=0.0838 + throughput/total_tokens=285,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1487/500000] + train/ActionL1Loss=0.0854 + throughput/total_tokens=285,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1488/500000] + train/ActionL1Loss=0.0864 + throughput/total_tokens=285,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1489/500000] + train/ActionL1Loss=0.0875 + throughput/total_tokens=285,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1490/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=286,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1491/500000] + train/ActionL1Loss=0.0979 + throughput/total_tokens=286,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1492/500000] + train/ActionL1Loss=0.0823 + throughput/total_tokens=286,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1493/500000] + train/ActionL1Loss=0.0901 + throughput/total_tokens=286,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1494/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=286,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1495/500000] + train/ActionL1Loss=0.0927 + throughput/total_tokens=287,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1496/500000] + train/ActionL1Loss=0.0903 + throughput/total_tokens=287,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1497/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=287,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1498/500000] + train/ActionL1Loss=0.0970 + throughput/total_tokens=287,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1499/500000] + train/ActionL1Loss=0.0979 + throughput/total_tokens=287,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1500/500000] + optim/total_grad_norm=9.878 + train/ActionL1Loss=0.0969 + throughput/total_tokens=288,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +10/12 [01:21:10] INFO | >> Saving config... checkpoint.py:608 +10/12 [01:21:42] INFO | >> Saving model state... checkpoint.py:796 +10/12 [01:22:51] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [01:24:22] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=1501/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=288,192,000 + throughput/device/tokens_per_second=1,207 + throughput/device/batches_per_second=0.0503 +[step=1502/500000] + train/ActionL1Loss=0.1071 + throughput/total_tokens=288,384,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=1503/500000] + train/ActionL1Loss=0.0879 + throughput/total_tokens=288,576,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1504/500000] + train/ActionL1Loss=0.0869 + throughput/total_tokens=288,768,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1505/500000] + train/ActionL1Loss=0.0951 + throughput/total_tokens=288,960,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1506/500000] + train/ActionL1Loss=0.0879 + throughput/total_tokens=289,152,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1507/500000] + train/ActionL1Loss=0.0925 + throughput/total_tokens=289,344,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1508/500000] + train/ActionL1Loss=0.0971 + throughput/total_tokens=289,536,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1509/500000] + train/ActionL1Loss=0.1112 + throughput/total_tokens=289,728,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1510/500000] + train/ActionL1Loss=0.0804 + throughput/total_tokens=289,920,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1511/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=290,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1512/500000] + train/ActionL1Loss=0.0871 + throughput/total_tokens=290,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1513/500000] + train/ActionL1Loss=0.0902 + throughput/total_tokens=290,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1514/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=290,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1515/500000] + train/ActionL1Loss=0.0908 + throughput/total_tokens=290,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1516/500000] + train/ActionL1Loss=0.0990 + throughput/total_tokens=291,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1517/500000] + train/ActionL1Loss=0.0941 + throughput/total_tokens=291,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1518/500000] + train/ActionL1Loss=0.0906 + throughput/total_tokens=291,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1519/500000] + train/ActionL1Loss=0.0962 + throughput/total_tokens=291,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1520/500000] + optim/total_grad_norm=10.80 + train/ActionL1Loss=0.0857 + throughput/total_tokens=291,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1521/500000] + train/ActionL1Loss=0.1028 + throughput/total_tokens=292,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1522/500000] + train/ActionL1Loss=0.0828 + throughput/total_tokens=292,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1523/500000] + train/ActionL1Loss=0.0822 + throughput/total_tokens=292,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1524/500000] + train/ActionL1Loss=0.0873 + throughput/total_tokens=292,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1525/500000] + train/ActionL1Loss=0.1062 + throughput/total_tokens=292,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1526/500000] + train/ActionL1Loss=0.0834 + throughput/total_tokens=292,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1527/500000] + train/ActionL1Loss=0.0820 + throughput/total_tokens=293,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1528/500000] + train/ActionL1Loss=0.0808 + throughput/total_tokens=293,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1529/500000] + train/ActionL1Loss=0.0887 + throughput/total_tokens=293,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1530/500000] + train/ActionL1Loss=0.0950 + throughput/total_tokens=293,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1531/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=293,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1532/500000] + train/ActionL1Loss=0.0733 + throughput/total_tokens=294,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1533/500000] + train/ActionL1Loss=0.0866 + throughput/total_tokens=294,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1534/500000] + train/ActionL1Loss=0.0856 + throughput/total_tokens=294,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1535/500000] + train/ActionL1Loss=0.0905 + throughput/total_tokens=294,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1536/500000] + train/ActionL1Loss=0.0920 + throughput/total_tokens=294,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1537/500000] + train/ActionL1Loss=0.0865 + throughput/total_tokens=295,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1538/500000] + train/ActionL1Loss=0.0879 + throughput/total_tokens=295,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1539/500000] + train/ActionL1Loss=0.0808 + throughput/total_tokens=295,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1540/500000] + optim/total_grad_norm=11.50 + train/ActionL1Loss=0.0981 + throughput/total_tokens=295,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1541/500000] + train/ActionL1Loss=0.0964 + throughput/total_tokens=295,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1542/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=296,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1543/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=296,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1544/500000] + train/ActionL1Loss=0.0912 + throughput/total_tokens=296,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1545/500000] + train/ActionL1Loss=0.0803 + throughput/total_tokens=296,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1546/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=296,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1547/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=297,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1548/500000] + train/ActionL1Loss=0.0863 + throughput/total_tokens=297,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1549/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=297,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1550/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=297,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1551/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=297,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1552/500000] + train/ActionL1Loss=0.0813 + throughput/total_tokens=297,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1553/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=298,176,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1554/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=298,368,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1555/500000] + train/ActionL1Loss=0.0901 + throughput/total_tokens=298,560,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1556/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=298,752,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1557/500000] + train/ActionL1Loss=0.0885 + throughput/total_tokens=298,944,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1558/500000] + train/ActionL1Loss=0.0972 + throughput/total_tokens=299,136,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1559/500000] + train/ActionL1Loss=0.0844 + throughput/total_tokens=299,328,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1560/500000] + optim/total_grad_norm=9.098 + train/ActionL1Loss=0.0731 + throughput/total_tokens=299,520,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=1561/500000] + train/ActionL1Loss=0.0786 + throughput/total_tokens=299,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1562/500000] + train/ActionL1Loss=0.0681 + throughput/total_tokens=299,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1563/500000] + train/ActionL1Loss=0.0786 + throughput/total_tokens=300,096,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=1564/500000] + train/ActionL1Loss=0.0730 + throughput/total_tokens=300,288,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=1565/500000] + train/ActionL1Loss=0.0839 + throughput/total_tokens=300,480,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1566/500000] + train/ActionL1Loss=0.0747 + throughput/total_tokens=300,672,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1567/500000] + train/ActionL1Loss=0.0732 + throughput/total_tokens=300,864,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1568/500000] + train/ActionL1Loss=0.0731 + throughput/total_tokens=301,056,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1569/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=301,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1570/500000] + train/ActionL1Loss=0.0952 + throughput/total_tokens=301,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1571/500000] + train/ActionL1Loss=0.0888 + throughput/total_tokens=301,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1572/500000] + train/ActionL1Loss=0.1000 + throughput/total_tokens=301,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1573/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=302,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1574/500000] + train/ActionL1Loss=0.0924 + throughput/total_tokens=302,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1575/500000] + train/ActionL1Loss=0.0862 + throughput/total_tokens=302,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1576/500000] + train/ActionL1Loss=0.0991 + throughput/total_tokens=302,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1577/500000] + train/ActionL1Loss=0.0912 + throughput/total_tokens=302,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1578/500000] + train/ActionL1Loss=0.0999 + throughput/total_tokens=302,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1579/500000] + train/ActionL1Loss=0.0864 + throughput/total_tokens=303,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1580/500000] + optim/total_grad_norm=10.05 + train/ActionL1Loss=0.0770 + throughput/total_tokens=303,360,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1581/500000] + train/ActionL1Loss=0.0836 + throughput/total_tokens=303,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1582/500000] + train/ActionL1Loss=0.0991 + throughput/total_tokens=303,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1583/500000] + train/ActionL1Loss=0.0826 + throughput/total_tokens=303,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1584/500000] + train/ActionL1Loss=0.1004 + throughput/total_tokens=304,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1585/500000] + train/ActionL1Loss=0.0890 + throughput/total_tokens=304,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1586/500000] + train/ActionL1Loss=0.0818 + throughput/total_tokens=304,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1587/500000] + train/ActionL1Loss=0.0778 + throughput/total_tokens=304,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1588/500000] + train/ActionL1Loss=0.0813 + throughput/total_tokens=304,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1589/500000] + train/ActionL1Loss=0.0797 + throughput/total_tokens=305,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1590/500000] + train/ActionL1Loss=0.0855 + throughput/total_tokens=305,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1591/500000] + train/ActionL1Loss=0.1043 + throughput/total_tokens=305,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1592/500000] + train/ActionL1Loss=0.0957 + throughput/total_tokens=305,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1593/500000] + train/ActionL1Loss=0.0920 + throughput/total_tokens=305,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1594/500000] + train/ActionL1Loss=0.0930 + throughput/total_tokens=306,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1595/500000] + train/ActionL1Loss=0.0979 + throughput/total_tokens=306,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1596/500000] + train/ActionL1Loss=0.1004 + throughput/total_tokens=306,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1597/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=306,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1598/500000] + train/ActionL1Loss=0.0789 + throughput/total_tokens=306,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1599/500000] + train/ActionL1Loss=0.0866 + throughput/total_tokens=307,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1600/500000] + optim/total_grad_norm=10.45 + train/ActionL1Loss=0.0686 + throughput/total_tokens=307,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1601/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=307,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1602/500000] + train/ActionL1Loss=0.0905 + throughput/total_tokens=307,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1603/500000] + train/ActionL1Loss=0.0898 + throughput/total_tokens=307,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1604/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=307,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1605/500000] + train/ActionL1Loss=0.1082 + throughput/total_tokens=308,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1606/500000] + train/ActionL1Loss=0.0910 + throughput/total_tokens=308,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1607/500000] + train/ActionL1Loss=0.0840 + throughput/total_tokens=308,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1608/500000] + train/ActionL1Loss=0.0830 + throughput/total_tokens=308,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1609/500000] + train/ActionL1Loss=0.0875 + throughput/total_tokens=308,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1610/500000] + train/ActionL1Loss=0.0945 + throughput/total_tokens=309,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1611/500000] + train/ActionL1Loss=0.0905 + throughput/total_tokens=309,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1612/500000] + train/ActionL1Loss=0.0913 + throughput/total_tokens=309,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1613/500000] + train/ActionL1Loss=0.0836 + throughput/total_tokens=309,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1614/500000] + train/ActionL1Loss=0.0780 + throughput/total_tokens=309,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1615/500000] + train/ActionL1Loss=0.0985 + throughput/total_tokens=310,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1616/500000] + train/ActionL1Loss=0.0806 + throughput/total_tokens=310,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1617/500000] + train/ActionL1Loss=0.0912 + throughput/total_tokens=310,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1618/500000] + train/ActionL1Loss=0.0789 + throughput/total_tokens=310,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1619/500000] + train/ActionL1Loss=0.0907 + throughput/total_tokens=310,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1620/500000] + optim/total_grad_norm=9.458 + train/ActionL1Loss=0.0733 + throughput/total_tokens=311,040,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=1621/500000] + train/ActionL1Loss=0.0986 + throughput/total_tokens=311,232,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1622/500000] + train/ActionL1Loss=0.1041 + throughput/total_tokens=311,424,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1623/500000] + train/ActionL1Loss=0.0910 + throughput/total_tokens=311,616,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1624/500000] + train/ActionL1Loss=0.0823 + throughput/total_tokens=311,808,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=1625/500000] + train/ActionL1Loss=0.0778 + throughput/total_tokens=312,000,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1626/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=312,192,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1627/500000] + train/ActionL1Loss=0.0821 + throughput/total_tokens=312,384,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1628/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=312,576,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1629/500000] + train/ActionL1Loss=0.0745 + throughput/total_tokens=312,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1630/500000] + train/ActionL1Loss=0.0939 + throughput/total_tokens=312,960,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1631/500000] + train/ActionL1Loss=0.0962 + throughput/total_tokens=313,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1632/500000] + train/ActionL1Loss=0.0918 + throughput/total_tokens=313,344,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1633/500000] + train/ActionL1Loss=0.0881 + throughput/total_tokens=313,536,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1634/500000] + train/ActionL1Loss=0.0874 + throughput/total_tokens=313,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1635/500000] + train/ActionL1Loss=0.0861 + throughput/total_tokens=313,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1636/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=314,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1637/500000] + train/ActionL1Loss=0.1014 + throughput/total_tokens=314,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1638/500000] + train/ActionL1Loss=0.0969 + throughput/total_tokens=314,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1639/500000] + train/ActionL1Loss=0.1030 + throughput/total_tokens=314,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1640/500000] + optim/total_grad_norm=10.31 + train/ActionL1Loss=0.0989 + throughput/total_tokens=314,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1641/500000] + train/ActionL1Loss=0.0817 + throughput/total_tokens=315,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1642/500000] + train/ActionL1Loss=0.0901 + throughput/total_tokens=315,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1643/500000] + train/ActionL1Loss=0.0789 + throughput/total_tokens=315,456,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1644/500000] + train/ActionL1Loss=0.0822 + throughput/total_tokens=315,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1645/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=315,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1646/500000] + train/ActionL1Loss=0.0913 + throughput/total_tokens=316,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1647/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=316,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1648/500000] + train/ActionL1Loss=0.0956 + throughput/total_tokens=316,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1649/500000] + train/ActionL1Loss=0.0920 + throughput/total_tokens=316,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1650/500000] + train/ActionL1Loss=0.0772 + throughput/total_tokens=316,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1651/500000] + train/ActionL1Loss=0.0926 + throughput/total_tokens=316,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1652/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=317,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1653/500000] + train/ActionL1Loss=0.0759 + throughput/total_tokens=317,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1654/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=317,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1655/500000] + train/ActionL1Loss=0.0865 + throughput/total_tokens=317,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1656/500000] + train/ActionL1Loss=0.0848 + throughput/total_tokens=317,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1657/500000] + train/ActionL1Loss=0.0898 + throughput/total_tokens=318,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1658/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=318,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1659/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=318,528,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1660/500000] + optim/total_grad_norm=9.942 + train/ActionL1Loss=0.0902 + throughput/total_tokens=318,720,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=1661/500000] + train/ActionL1Loss=0.0866 + throughput/total_tokens=318,912,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1662/500000] + train/ActionL1Loss=0.0840 + throughput/total_tokens=319,104,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1663/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=319,296,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=1664/500000] + train/ActionL1Loss=0.0891 + throughput/total_tokens=319,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1665/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=319,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1666/500000] + train/ActionL1Loss=0.0810 + throughput/total_tokens=319,872,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1667/500000] + train/ActionL1Loss=0.0745 + throughput/total_tokens=320,064,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1668/500000] + train/ActionL1Loss=0.0852 + throughput/total_tokens=320,256,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=1669/500000] + train/ActionL1Loss=0.0819 + throughput/total_tokens=320,448,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=1670/500000] + train/ActionL1Loss=0.0832 + throughput/total_tokens=320,640,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1671/500000] + train/ActionL1Loss=0.0819 + throughput/total_tokens=320,832,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1672/500000] + train/ActionL1Loss=0.0787 + throughput/total_tokens=321,024,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1673/500000] + train/ActionL1Loss=0.0881 + throughput/total_tokens=321,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1674/500000] + train/ActionL1Loss=0.0759 + throughput/total_tokens=321,408,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1675/500000] + train/ActionL1Loss=0.0733 + throughput/total_tokens=321,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1676/500000] + train/ActionL1Loss=0.0852 + throughput/total_tokens=321,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1677/500000] + train/ActionL1Loss=0.1033 + throughput/total_tokens=321,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1678/500000] + train/ActionL1Loss=0.0808 + throughput/total_tokens=322,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1679/500000] + train/ActionL1Loss=0.0797 + throughput/total_tokens=322,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1680/500000] + optim/total_grad_norm=9.265 + train/ActionL1Loss=0.0990 + throughput/total_tokens=322,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1681/500000] + train/ActionL1Loss=0.0756 + throughput/total_tokens=322,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1682/500000] + train/ActionL1Loss=0.0932 + throughput/total_tokens=322,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1683/500000] + train/ActionL1Loss=0.0918 + throughput/total_tokens=323,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1684/500000] + train/ActionL1Loss=0.0833 + throughput/total_tokens=323,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1685/500000] + train/ActionL1Loss=0.0915 + throughput/total_tokens=323,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1686/500000] + train/ActionL1Loss=0.0932 + throughput/total_tokens=323,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1687/500000] + train/ActionL1Loss=0.0877 + throughput/total_tokens=323,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1688/500000] + train/ActionL1Loss=0.0821 + throughput/total_tokens=324,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1689/500000] + train/ActionL1Loss=0.0994 + throughput/total_tokens=324,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1690/500000] + train/ActionL1Loss=0.0847 + throughput/total_tokens=324,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1691/500000] + train/ActionL1Loss=0.0897 + throughput/total_tokens=324,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1692/500000] + train/ActionL1Loss=0.0933 + throughput/total_tokens=324,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1693/500000] + train/ActionL1Loss=0.0976 + throughput/total_tokens=325,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1694/500000] + train/ActionL1Loss=0.1076 + throughput/total_tokens=325,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1695/500000] + train/ActionL1Loss=0.0825 + throughput/total_tokens=325,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1696/500000] + train/ActionL1Loss=0.0726 + throughput/total_tokens=325,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1697/500000] + train/ActionL1Loss=0.0951 + throughput/total_tokens=325,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1698/500000] + train/ActionL1Loss=0.0725 + throughput/total_tokens=326,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1699/500000] + train/ActionL1Loss=0.0702 + throughput/total_tokens=326,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1700/500000] + optim/total_grad_norm=10.69 + train/ActionL1Loss=0.0794 + throughput/total_tokens=326,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1701/500000] + train/ActionL1Loss=0.0815 + throughput/total_tokens=326,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1702/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=326,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1703/500000] + train/ActionL1Loss=0.1003 + throughput/total_tokens=326,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1704/500000] + train/ActionL1Loss=0.1000 + throughput/total_tokens=327,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1705/500000] + train/ActionL1Loss=0.0873 + throughput/total_tokens=327,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1706/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=327,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1707/500000] + train/ActionL1Loss=0.0743 + throughput/total_tokens=327,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1708/500000] + train/ActionL1Loss=0.0917 + throughput/total_tokens=327,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1709/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=328,128,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1710/500000] + train/ActionL1Loss=0.0945 + throughput/total_tokens=328,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1711/500000] + train/ActionL1Loss=0.0859 + throughput/total_tokens=328,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1712/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=328,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1713/500000] + train/ActionL1Loss=0.0908 + throughput/total_tokens=328,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1714/500000] + train/ActionL1Loss=0.0783 + throughput/total_tokens=329,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1715/500000] + train/ActionL1Loss=0.0797 + throughput/total_tokens=329,280,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1716/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=329,472,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1717/500000] + train/ActionL1Loss=0.0742 + throughput/total_tokens=329,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1718/500000] + train/ActionL1Loss=0.0689 + throughput/total_tokens=329,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1719/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=330,048,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1720/500000] + optim/total_grad_norm=9.968 + train/ActionL1Loss=0.0918 + throughput/total_tokens=330,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1721/500000] + train/ActionL1Loss=0.0773 + throughput/total_tokens=330,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1722/500000] + train/ActionL1Loss=0.0883 + throughput/total_tokens=330,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1723/500000] + train/ActionL1Loss=0.0772 + throughput/total_tokens=330,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1724/500000] + train/ActionL1Loss=0.0732 + throughput/total_tokens=331,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1725/500000] + train/ActionL1Loss=0.0812 + throughput/total_tokens=331,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1726/500000] + train/ActionL1Loss=0.0807 + throughput/total_tokens=331,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1727/500000] + train/ActionL1Loss=0.0707 + throughput/total_tokens=331,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1728/500000] + train/ActionL1Loss=0.0820 + throughput/total_tokens=331,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1729/500000] + train/ActionL1Loss=0.0839 + throughput/total_tokens=331,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1730/500000] + train/ActionL1Loss=0.0751 + throughput/total_tokens=332,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1731/500000] + train/ActionL1Loss=0.0842 + throughput/total_tokens=332,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1732/500000] + train/ActionL1Loss=0.0982 + throughput/total_tokens=332,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1733/500000] + train/ActionL1Loss=0.0815 + throughput/total_tokens=332,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1734/500000] + train/ActionL1Loss=0.0906 + throughput/total_tokens=332,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1735/500000] + train/ActionL1Loss=0.0775 + throughput/total_tokens=333,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1736/500000] + train/ActionL1Loss=0.0967 + throughput/total_tokens=333,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1737/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=333,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1738/500000] + train/ActionL1Loss=0.0915 + throughput/total_tokens=333,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1739/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=333,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1740/500000] + optim/total_grad_norm=10.53 + train/ActionL1Loss=0.0885 + throughput/total_tokens=334,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1741/500000] + train/ActionL1Loss=0.0871 + throughput/total_tokens=334,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1742/500000] + train/ActionL1Loss=0.0780 + throughput/total_tokens=334,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1743/500000] + train/ActionL1Loss=0.0917 + throughput/total_tokens=334,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1744/500000] + train/ActionL1Loss=0.0647 + throughput/total_tokens=334,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1745/500000] + train/ActionL1Loss=0.0791 + throughput/total_tokens=335,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1746/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=335,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1747/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=335,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1748/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=335,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1749/500000] + train/ActionL1Loss=0.0812 + throughput/total_tokens=335,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1750/500000] + train/ActionL1Loss=0.0903 + throughput/total_tokens=336,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1751/500000] + train/ActionL1Loss=0.0779 + throughput/total_tokens=336,192,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1752/500000] + train/ActionL1Loss=0.0864 + throughput/total_tokens=336,384,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1753/500000] + train/ActionL1Loss=0.0858 + throughput/total_tokens=336,576,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1754/500000] + train/ActionL1Loss=0.0885 + throughput/total_tokens=336,768,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1755/500000] + train/ActionL1Loss=0.0998 + throughput/total_tokens=336,960,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1756/500000] + train/ActionL1Loss=0.1009 + throughput/total_tokens=337,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1757/500000] + train/ActionL1Loss=0.0791 + throughput/total_tokens=337,344,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1758/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=337,536,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1759/500000] + train/ActionL1Loss=0.0818 + throughput/total_tokens=337,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1760/500000] + optim/total_grad_norm=11.96 + train/ActionL1Loss=0.0983 + throughput/total_tokens=337,920,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1761/500000] + train/ActionL1Loss=0.0947 + throughput/total_tokens=338,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1762/500000] + train/ActionL1Loss=0.0905 + throughput/total_tokens=338,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1763/500000] + train/ActionL1Loss=0.0915 + throughput/total_tokens=338,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1764/500000] + train/ActionL1Loss=0.0876 + throughput/total_tokens=338,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1765/500000] + train/ActionL1Loss=0.0809 + throughput/total_tokens=338,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1766/500000] + train/ActionL1Loss=0.0809 + throughput/total_tokens=339,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1767/500000] + train/ActionL1Loss=0.0742 + throughput/total_tokens=339,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1768/500000] + train/ActionL1Loss=0.0790 + throughput/total_tokens=339,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1769/500000] + train/ActionL1Loss=0.0723 + throughput/total_tokens=339,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1770/500000] + train/ActionL1Loss=0.0858 + throughput/total_tokens=339,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1771/500000] + train/ActionL1Loss=0.0955 + throughput/total_tokens=340,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1772/500000] + train/ActionL1Loss=0.0951 + throughput/total_tokens=340,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1773/500000] + train/ActionL1Loss=0.0798 + throughput/total_tokens=340,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1774/500000] + train/ActionL1Loss=0.0782 + throughput/total_tokens=340,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1775/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=340,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1776/500000] + train/ActionL1Loss=0.0772 + throughput/total_tokens=340,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1777/500000] + train/ActionL1Loss=0.0875 + throughput/total_tokens=341,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1778/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=341,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1779/500000] + train/ActionL1Loss=0.0777 + throughput/total_tokens=341,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1780/500000] + optim/total_grad_norm=11.12 + train/ActionL1Loss=0.1011 + throughput/total_tokens=341,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1781/500000] + train/ActionL1Loss=0.0758 + throughput/total_tokens=341,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1782/500000] + train/ActionL1Loss=0.0875 + throughput/total_tokens=342,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1783/500000] + train/ActionL1Loss=0.0927 + throughput/total_tokens=342,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1784/500000] + train/ActionL1Loss=0.0763 + throughput/total_tokens=342,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1785/500000] + train/ActionL1Loss=0.0880 + throughput/total_tokens=342,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1786/500000] + train/ActionL1Loss=0.0727 + throughput/total_tokens=342,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1787/500000] + train/ActionL1Loss=0.0758 + throughput/total_tokens=343,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1788/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=343,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1789/500000] + train/ActionL1Loss=0.0791 + throughput/total_tokens=343,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1790/500000] + train/ActionL1Loss=0.0990 + throughput/total_tokens=343,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1791/500000] + train/ActionL1Loss=0.0954 + throughput/total_tokens=343,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1792/500000] + train/ActionL1Loss=0.0886 + throughput/total_tokens=344,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1793/500000] + train/ActionL1Loss=0.0859 + throughput/total_tokens=344,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1794/500000] + train/ActionL1Loss=0.0862 + throughput/total_tokens=344,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1795/500000] + train/ActionL1Loss=0.0794 + throughput/total_tokens=344,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1796/500000] + train/ActionL1Loss=0.0787 + throughput/total_tokens=344,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1797/500000] + train/ActionL1Loss=0.0891 + throughput/total_tokens=345,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1798/500000] + train/ActionL1Loss=0.1026 + throughput/total_tokens=345,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1799/500000] + train/ActionL1Loss=0.0825 + throughput/total_tokens=345,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1800/500000] + optim/total_grad_norm=10.86 + train/ActionL1Loss=0.0782 + throughput/total_tokens=345,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1801/500000] + train/ActionL1Loss=0.0939 + throughput/total_tokens=345,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1802/500000] + train/ActionL1Loss=0.0798 + throughput/total_tokens=345,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1803/500000] + train/ActionL1Loss=0.0945 + throughput/total_tokens=346,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1804/500000] + train/ActionL1Loss=0.0924 + throughput/total_tokens=346,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1805/500000] + train/ActionL1Loss=0.0970 + throughput/total_tokens=346,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1806/500000] + train/ActionL1Loss=0.0930 + throughput/total_tokens=346,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1807/500000] + train/ActionL1Loss=0.0720 + throughput/total_tokens=346,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1808/500000] + train/ActionL1Loss=0.0903 + throughput/total_tokens=347,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1809/500000] + train/ActionL1Loss=0.0860 + throughput/total_tokens=347,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1810/500000] + train/ActionL1Loss=0.0860 + throughput/total_tokens=347,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1811/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=347,712,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=1812/500000] + train/ActionL1Loss=0.0962 + throughput/total_tokens=347,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1813/500000] + train/ActionL1Loss=0.1099 + throughput/total_tokens=348,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1814/500000] + train/ActionL1Loss=0.0871 + throughput/total_tokens=348,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1815/500000] + train/ActionL1Loss=0.0926 + throughput/total_tokens=348,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1816/500000] + train/ActionL1Loss=0.0958 + throughput/total_tokens=348,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1817/500000] + train/ActionL1Loss=0.0815 + throughput/total_tokens=348,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1818/500000] + train/ActionL1Loss=0.0787 + throughput/total_tokens=349,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1819/500000] + train/ActionL1Loss=0.0978 + throughput/total_tokens=349,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1820/500000] + optim/total_grad_norm=10.02 + train/ActionL1Loss=0.0815 + throughput/total_tokens=349,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1821/500000] + train/ActionL1Loss=0.0911 + throughput/total_tokens=349,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1822/500000] + train/ActionL1Loss=0.0970 + throughput/total_tokens=349,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1823/500000] + train/ActionL1Loss=0.1047 + throughput/total_tokens=350,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1824/500000] + train/ActionL1Loss=0.0873 + throughput/total_tokens=350,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1825/500000] + train/ActionL1Loss=0.0904 + throughput/total_tokens=350,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1826/500000] + train/ActionL1Loss=0.0708 + throughput/total_tokens=350,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1827/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=350,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1828/500000] + train/ActionL1Loss=0.0880 + throughput/total_tokens=350,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1829/500000] + train/ActionL1Loss=0.0841 + throughput/total_tokens=351,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1830/500000] + train/ActionL1Loss=0.0944 + throughput/total_tokens=351,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1831/500000] + train/ActionL1Loss=0.1021 + throughput/total_tokens=351,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1832/500000] + train/ActionL1Loss=0.0798 + throughput/total_tokens=351,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1833/500000] + train/ActionL1Loss=0.0910 + throughput/total_tokens=351,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1834/500000] + train/ActionL1Loss=0.1021 + throughput/total_tokens=352,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1835/500000] + train/ActionL1Loss=0.0974 + throughput/total_tokens=352,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1836/500000] + train/ActionL1Loss=0.0809 + throughput/total_tokens=352,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1837/500000] + train/ActionL1Loss=0.0881 + throughput/total_tokens=352,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1838/500000] + train/ActionL1Loss=0.1042 + throughput/total_tokens=352,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1839/500000] + train/ActionL1Loss=0.0959 + throughput/total_tokens=353,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1840/500000] + optim/total_grad_norm=10.69 + train/ActionL1Loss=0.1047 + throughput/total_tokens=353,280,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1841/500000] + train/ActionL1Loss=0.1026 + throughput/total_tokens=353,472,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1842/500000] + train/ActionL1Loss=0.0974 + throughput/total_tokens=353,664,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1843/500000] + train/ActionL1Loss=0.0991 + throughput/total_tokens=353,856,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1844/500000] + train/ActionL1Loss=0.0844 + throughput/total_tokens=354,048,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1845/500000] + train/ActionL1Loss=0.0779 + throughput/total_tokens=354,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1846/500000] + train/ActionL1Loss=0.0740 + throughput/total_tokens=354,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1847/500000] + train/ActionL1Loss=0.0925 + throughput/total_tokens=354,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1848/500000] + train/ActionL1Loss=0.0753 + throughput/total_tokens=354,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1849/500000] + train/ActionL1Loss=0.0918 + throughput/total_tokens=355,008,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=1850/500000] + train/ActionL1Loss=0.0774 + throughput/total_tokens=355,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1851/500000] + train/ActionL1Loss=0.0849 + throughput/total_tokens=355,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1852/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=355,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1853/500000] + train/ActionL1Loss=0.0944 + throughput/total_tokens=355,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1854/500000] + train/ActionL1Loss=0.0855 + throughput/total_tokens=355,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1855/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=356,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1856/500000] + train/ActionL1Loss=0.0878 + throughput/total_tokens=356,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1857/500000] + train/ActionL1Loss=0.0905 + throughput/total_tokens=356,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1858/500000] + train/ActionL1Loss=0.0838 + throughput/total_tokens=356,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1859/500000] + train/ActionL1Loss=0.0782 + throughput/total_tokens=356,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1860/500000] + optim/total_grad_norm=10.15 + train/ActionL1Loss=0.0799 + throughput/total_tokens=357,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1861/500000] + train/ActionL1Loss=0.0808 + throughput/total_tokens=357,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1862/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=357,504,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=1863/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=357,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1864/500000] + train/ActionL1Loss=0.0985 + throughput/total_tokens=357,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1865/500000] + train/ActionL1Loss=0.0906 + throughput/total_tokens=358,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1866/500000] + train/ActionL1Loss=0.1056 + throughput/total_tokens=358,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1867/500000] + train/ActionL1Loss=0.0951 + throughput/total_tokens=358,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1868/500000] + train/ActionL1Loss=0.0967 + throughput/total_tokens=358,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1869/500000] + train/ActionL1Loss=0.0857 + throughput/total_tokens=358,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1870/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=359,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1871/500000] + train/ActionL1Loss=0.0934 + throughput/total_tokens=359,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1872/500000] + train/ActionL1Loss=0.0733 + throughput/total_tokens=359,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1873/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=359,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1874/500000] + train/ActionL1Loss=0.0907 + throughput/total_tokens=359,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1875/500000] + train/ActionL1Loss=0.1010 + throughput/total_tokens=360,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1876/500000] + train/ActionL1Loss=0.0987 + throughput/total_tokens=360,192,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1877/500000] + train/ActionL1Loss=0.0823 + throughput/total_tokens=360,384,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1878/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=360,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1879/500000] + train/ActionL1Loss=0.0774 + throughput/total_tokens=360,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=1880/500000] + optim/total_grad_norm=10.13 + train/ActionL1Loss=0.0709 + throughput/total_tokens=360,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=1881/500000] + train/ActionL1Loss=0.0987 + throughput/total_tokens=361,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=1882/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=361,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1883/500000] + train/ActionL1Loss=0.0932 + throughput/total_tokens=361,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1884/500000] + train/ActionL1Loss=0.1082 + throughput/total_tokens=361,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1885/500000] + train/ActionL1Loss=0.0959 + throughput/total_tokens=361,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1886/500000] + train/ActionL1Loss=0.1000 + throughput/total_tokens=362,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1887/500000] + train/ActionL1Loss=0.0728 + throughput/total_tokens=362,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1888/500000] + train/ActionL1Loss=0.0802 + throughput/total_tokens=362,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1889/500000] + train/ActionL1Loss=0.1044 + throughput/total_tokens=362,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1890/500000] + train/ActionL1Loss=0.0885 + throughput/total_tokens=362,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1891/500000] + train/ActionL1Loss=0.0949 + throughput/total_tokens=363,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1892/500000] + train/ActionL1Loss=0.0906 + throughput/total_tokens=363,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1893/500000] + train/ActionL1Loss=0.0907 + throughput/total_tokens=363,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1894/500000] + train/ActionL1Loss=0.0888 + throughput/total_tokens=363,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1895/500000] + train/ActionL1Loss=0.0915 + throughput/total_tokens=363,840,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1896/500000] + train/ActionL1Loss=0.0902 + throughput/total_tokens=364,032,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1897/500000] + train/ActionL1Loss=0.1053 + throughput/total_tokens=364,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1898/500000] + train/ActionL1Loss=0.1100 + throughput/total_tokens=364,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1899/500000] + train/ActionL1Loss=0.0813 + throughput/total_tokens=364,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=1900/500000] + optim/total_grad_norm=8.711 + train/ActionL1Loss=0.0883 + throughput/total_tokens=364,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1901/500000] + train/ActionL1Loss=0.1039 + throughput/total_tokens=364,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1902/500000] + train/ActionL1Loss=0.0944 + throughput/total_tokens=365,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1903/500000] + train/ActionL1Loss=0.0741 + throughput/total_tokens=365,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1904/500000] + train/ActionL1Loss=0.0879 + throughput/total_tokens=365,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1905/500000] + train/ActionL1Loss=0.0940 + throughput/total_tokens=365,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1906/500000] + train/ActionL1Loss=0.1039 + throughput/total_tokens=365,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1907/500000] + train/ActionL1Loss=0.0911 + throughput/total_tokens=366,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1908/500000] + train/ActionL1Loss=0.0929 + throughput/total_tokens=366,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1909/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=366,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1910/500000] + train/ActionL1Loss=0.0891 + throughput/total_tokens=366,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1911/500000] + train/ActionL1Loss=0.0822 + throughput/total_tokens=366,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1912/500000] + train/ActionL1Loss=0.0827 + throughput/total_tokens=367,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1913/500000] + train/ActionL1Loss=0.0781 + throughput/total_tokens=367,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1914/500000] + train/ActionL1Loss=0.0821 + throughput/total_tokens=367,488,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1915/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=367,680,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1916/500000] + train/ActionL1Loss=0.1019 + throughput/total_tokens=367,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1917/500000] + train/ActionL1Loss=0.0989 + throughput/total_tokens=368,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1918/500000] + train/ActionL1Loss=0.0912 + throughput/total_tokens=368,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1919/500000] + train/ActionL1Loss=0.0773 + throughput/total_tokens=368,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1920/500000] + optim/total_grad_norm=8.486 + train/ActionL1Loss=0.0802 + throughput/total_tokens=368,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=1921/500000] + train/ActionL1Loss=0.0775 + throughput/total_tokens=368,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1922/500000] + train/ActionL1Loss=0.0874 + throughput/total_tokens=369,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1923/500000] + train/ActionL1Loss=0.0785 + throughput/total_tokens=369,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=1924/500000] + train/ActionL1Loss=0.0839 + throughput/total_tokens=369,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1925/500000] + train/ActionL1Loss=0.0792 + throughput/total_tokens=369,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1926/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=369,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=1927/500000] + train/ActionL1Loss=0.0779 + throughput/total_tokens=369,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1928/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=370,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1929/500000] + train/ActionL1Loss=0.0733 + throughput/total_tokens=370,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1930/500000] + train/ActionL1Loss=0.0704 + throughput/total_tokens=370,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1931/500000] + train/ActionL1Loss=0.0684 + throughput/total_tokens=370,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1932/500000] + train/ActionL1Loss=0.0743 + throughput/total_tokens=370,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1933/500000] + train/ActionL1Loss=0.0695 + throughput/total_tokens=371,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1934/500000] + train/ActionL1Loss=0.0726 + throughput/total_tokens=371,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1935/500000] + train/ActionL1Loss=0.0769 + throughput/total_tokens=371,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1936/500000] + train/ActionL1Loss=0.0742 + throughput/total_tokens=371,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1937/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=371,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1938/500000] + train/ActionL1Loss=0.0791 + throughput/total_tokens=372,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1939/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=372,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1940/500000] + optim/total_grad_norm=10.62 + train/ActionL1Loss=0.0709 + throughput/total_tokens=372,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1941/500000] + train/ActionL1Loss=0.0840 + throughput/total_tokens=372,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1942/500000] + train/ActionL1Loss=0.0826 + throughput/total_tokens=372,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1943/500000] + train/ActionL1Loss=0.0926 + throughput/total_tokens=373,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1944/500000] + train/ActionL1Loss=0.0780 + throughput/total_tokens=373,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1945/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=373,440,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1946/500000] + train/ActionL1Loss=0.0764 + throughput/total_tokens=373,632,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1947/500000] + train/ActionL1Loss=0.0868 + throughput/total_tokens=373,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1948/500000] + train/ActionL1Loss=0.0774 + throughput/total_tokens=374,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1949/500000] + train/ActionL1Loss=0.0812 + throughput/total_tokens=374,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1950/500000] + train/ActionL1Loss=0.0786 + throughput/total_tokens=374,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1951/500000] + train/ActionL1Loss=0.0865 + throughput/total_tokens=374,592,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1952/500000] + train/ActionL1Loss=0.0816 + throughput/total_tokens=374,784,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1953/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=374,976,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1954/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=375,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1955/500000] + train/ActionL1Loss=0.0805 + throughput/total_tokens=375,360,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1956/500000] + train/ActionL1Loss=0.0694 + throughput/total_tokens=375,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1957/500000] + train/ActionL1Loss=0.0982 + throughput/total_tokens=375,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1958/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=375,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1959/500000] + train/ActionL1Loss=0.0752 + throughput/total_tokens=376,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=1960/500000] + optim/total_grad_norm=9.992 + train/ActionL1Loss=0.0859 + throughput/total_tokens=376,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=1961/500000] + train/ActionL1Loss=0.0786 + throughput/total_tokens=376,512,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1962/500000] + train/ActionL1Loss=0.0851 + throughput/total_tokens=376,704,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1963/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=376,896,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1964/500000] + train/ActionL1Loss=0.0790 + throughput/total_tokens=377,088,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1965/500000] + train/ActionL1Loss=0.0680 + throughput/total_tokens=377,280,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1966/500000] + train/ActionL1Loss=0.0724 + throughput/total_tokens=377,472,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1967/500000] + train/ActionL1Loss=0.0738 + throughput/total_tokens=377,664,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1968/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=377,856,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1969/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=378,048,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=1970/500000] + train/ActionL1Loss=0.0830 + throughput/total_tokens=378,240,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1971/500000] + train/ActionL1Loss=0.0831 + throughput/total_tokens=378,432,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1972/500000] + train/ActionL1Loss=0.0836 + throughput/total_tokens=378,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=1973/500000] + train/ActionL1Loss=0.0803 + throughput/total_tokens=378,816,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1974/500000] + train/ActionL1Loss=0.0709 + throughput/total_tokens=379,008,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1975/500000] + train/ActionL1Loss=0.0825 + throughput/total_tokens=379,200,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1976/500000] + train/ActionL1Loss=0.0829 + throughput/total_tokens=379,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1977/500000] + train/ActionL1Loss=0.0770 + throughput/total_tokens=379,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1978/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=379,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1979/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=379,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1980/500000] + optim/total_grad_norm=9.666 + train/ActionL1Loss=0.0798 + throughput/total_tokens=380,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1981/500000] + train/ActionL1Loss=0.0805 + throughput/total_tokens=380,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1982/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=380,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1983/500000] + train/ActionL1Loss=0.0759 + throughput/total_tokens=380,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1984/500000] + train/ActionL1Loss=0.0729 + throughput/total_tokens=380,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1985/500000] + train/ActionL1Loss=0.0819 + throughput/total_tokens=381,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1986/500000] + train/ActionL1Loss=0.0797 + throughput/total_tokens=381,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1987/500000] + train/ActionL1Loss=0.0711 + throughput/total_tokens=381,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1988/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=381,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1989/500000] + train/ActionL1Loss=0.0916 + throughput/total_tokens=381,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1990/500000] + train/ActionL1Loss=0.0774 + throughput/total_tokens=382,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=1991/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=382,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1992/500000] + train/ActionL1Loss=0.0862 + throughput/total_tokens=382,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1993/500000] + train/ActionL1Loss=0.0912 + throughput/total_tokens=382,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1994/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=382,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1995/500000] + train/ActionL1Loss=0.0888 + throughput/total_tokens=383,040,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=1996/500000] + train/ActionL1Loss=0.1084 + throughput/total_tokens=383,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1997/500000] + train/ActionL1Loss=0.0783 + throughput/total_tokens=383,424,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1998/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=383,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=1999/500000] + train/ActionL1Loss=0.0755 + throughput/total_tokens=383,808,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2000/500000] + optim/total_grad_norm=10.02 + train/ActionL1Loss=0.0846 + throughput/total_tokens=384,000,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +10/12 [04:15:35] INFO | >> Saving config... checkpoint.py:608 +10/12 [04:16:30] INFO | >> Saving model state... checkpoint.py:796 +10/12 [04:17:40] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [04:19:13] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=2001/500000] + train/ActionL1Loss=0.0834 + throughput/total_tokens=384,192,000 + throughput/device/tokens_per_second=1,211 + throughput/device/batches_per_second=0.0505 +[step=2002/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=384,384,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0495 +[step=2003/500000] + train/ActionL1Loss=0.0905 + throughput/total_tokens=384,576,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=2004/500000] + train/ActionL1Loss=0.1105 + throughput/total_tokens=384,768,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0494 +[step=2005/500000] + train/ActionL1Loss=0.0785 + throughput/total_tokens=384,960,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0494 +[step=2006/500000] + train/ActionL1Loss=0.0759 + throughput/total_tokens=385,152,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=2007/500000] + train/ActionL1Loss=0.0922 + throughput/total_tokens=385,344,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2008/500000] + train/ActionL1Loss=0.0823 + throughput/total_tokens=385,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2009/500000] + train/ActionL1Loss=0.0874 + throughput/total_tokens=385,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2010/500000] + train/ActionL1Loss=0.0844 + throughput/total_tokens=385,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2011/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=386,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2012/500000] + train/ActionL1Loss=0.0707 + throughput/total_tokens=386,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2013/500000] + train/ActionL1Loss=0.0784 + throughput/total_tokens=386,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2014/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=386,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2015/500000] + train/ActionL1Loss=0.0786 + throughput/total_tokens=386,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2016/500000] + train/ActionL1Loss=0.0646 + throughput/total_tokens=387,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2017/500000] + train/ActionL1Loss=0.0733 + throughput/total_tokens=387,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2018/500000] + train/ActionL1Loss=0.0696 + throughput/total_tokens=387,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2019/500000] + train/ActionL1Loss=0.0712 + throughput/total_tokens=387,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2020/500000] + optim/total_grad_norm=10.42 + train/ActionL1Loss=0.0754 + throughput/total_tokens=387,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2021/500000] + train/ActionL1Loss=0.0830 + throughput/total_tokens=388,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2022/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=388,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2023/500000] + train/ActionL1Loss=0.0791 + throughput/total_tokens=388,416,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2024/500000] + train/ActionL1Loss=0.0828 + throughput/total_tokens=388,608,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2025/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=388,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2026/500000] + train/ActionL1Loss=0.0764 + throughput/total_tokens=388,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2027/500000] + train/ActionL1Loss=0.0850 + throughput/total_tokens=389,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2028/500000] + train/ActionL1Loss=0.0808 + throughput/total_tokens=389,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2029/500000] + train/ActionL1Loss=0.0860 + throughput/total_tokens=389,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2030/500000] + train/ActionL1Loss=0.0986 + throughput/total_tokens=389,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2031/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=389,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2032/500000] + train/ActionL1Loss=0.0820 + throughput/total_tokens=390,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2033/500000] + train/ActionL1Loss=0.0891 + throughput/total_tokens=390,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2034/500000] + train/ActionL1Loss=0.0719 + throughput/total_tokens=390,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2035/500000] + train/ActionL1Loss=0.0742 + throughput/total_tokens=390,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2036/500000] + train/ActionL1Loss=0.0860 + throughput/total_tokens=390,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2037/500000] + train/ActionL1Loss=0.0838 + throughput/total_tokens=391,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2038/500000] + train/ActionL1Loss=0.0912 + throughput/total_tokens=391,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2039/500000] + train/ActionL1Loss=0.0779 + throughput/total_tokens=391,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2040/500000] + optim/total_grad_norm=9.260 + train/ActionL1Loss=0.0698 + throughput/total_tokens=391,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2041/500000] + train/ActionL1Loss=0.0912 + throughput/total_tokens=391,872,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2042/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=392,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2043/500000] + train/ActionL1Loss=0.0896 + throughput/total_tokens=392,256,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2044/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=392,448,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2045/500000] + train/ActionL1Loss=0.0855 + throughput/total_tokens=392,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2046/500000] + train/ActionL1Loss=0.0972 + throughput/total_tokens=392,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2047/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=393,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2048/500000] + train/ActionL1Loss=0.0834 + throughput/total_tokens=393,216,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2049/500000] + train/ActionL1Loss=0.0846 + throughput/total_tokens=393,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2050/500000] + train/ActionL1Loss=0.0874 + throughput/total_tokens=393,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2051/500000] + train/ActionL1Loss=0.0923 + throughput/total_tokens=393,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2052/500000] + train/ActionL1Loss=0.0929 + throughput/total_tokens=393,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2053/500000] + train/ActionL1Loss=0.0796 + throughput/total_tokens=394,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2054/500000] + train/ActionL1Loss=0.0752 + throughput/total_tokens=394,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2055/500000] + train/ActionL1Loss=0.0783 + throughput/total_tokens=394,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2056/500000] + train/ActionL1Loss=0.0780 + throughput/total_tokens=394,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2057/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=394,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2058/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=395,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2059/500000] + train/ActionL1Loss=0.0915 + throughput/total_tokens=395,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2060/500000] + optim/total_grad_norm=11.05 + train/ActionL1Loss=0.0819 + throughput/total_tokens=395,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2061/500000] + train/ActionL1Loss=0.0895 + throughput/total_tokens=395,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2062/500000] + train/ActionL1Loss=0.0844 + throughput/total_tokens=395,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2063/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=396,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2064/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=396,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2065/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=396,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2066/500000] + train/ActionL1Loss=0.0737 + throughput/total_tokens=396,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2067/500000] + train/ActionL1Loss=0.0875 + throughput/total_tokens=396,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2068/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=397,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2069/500000] + train/ActionL1Loss=0.0865 + throughput/total_tokens=397,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2070/500000] + train/ActionL1Loss=0.0839 + throughput/total_tokens=397,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2071/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=397,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2072/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=397,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2073/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=398,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2074/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=398,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2075/500000] + train/ActionL1Loss=0.0731 + throughput/total_tokens=398,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2076/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=398,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2077/500000] + train/ActionL1Loss=0.0741 + throughput/total_tokens=398,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2078/500000] + train/ActionL1Loss=0.0854 + throughput/total_tokens=398,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2079/500000] + train/ActionL1Loss=0.0936 + throughput/total_tokens=399,168,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2080/500000] + optim/total_grad_norm=8.210 + train/ActionL1Loss=0.0608 + throughput/total_tokens=399,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2081/500000] + train/ActionL1Loss=0.0741 + throughput/total_tokens=399,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2082/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=399,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2083/500000] + train/ActionL1Loss=0.0822 + throughput/total_tokens=399,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2084/500000] + train/ActionL1Loss=0.0772 + throughput/total_tokens=400,128,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2085/500000] + train/ActionL1Loss=0.0769 + throughput/total_tokens=400,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2086/500000] + train/ActionL1Loss=0.0858 + throughput/total_tokens=400,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2087/500000] + train/ActionL1Loss=0.0769 + throughput/total_tokens=400,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2088/500000] + train/ActionL1Loss=0.0890 + throughput/total_tokens=400,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2089/500000] + train/ActionL1Loss=0.0828 + throughput/total_tokens=401,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2090/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=401,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2091/500000] + train/ActionL1Loss=0.0791 + throughput/total_tokens=401,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2092/500000] + train/ActionL1Loss=0.0790 + throughput/total_tokens=401,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2093/500000] + train/ActionL1Loss=0.0781 + throughput/total_tokens=401,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2094/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=402,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2095/500000] + train/ActionL1Loss=0.0817 + throughput/total_tokens=402,240,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2096/500000] + train/ActionL1Loss=0.0749 + throughput/total_tokens=402,432,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2097/500000] + train/ActionL1Loss=0.0797 + throughput/total_tokens=402,624,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2098/500000] + train/ActionL1Loss=0.0836 + throughput/total_tokens=402,816,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2099/500000] + train/ActionL1Loss=0.0742 + throughput/total_tokens=403,008,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2100/500000] + optim/total_grad_norm=8.064 + train/ActionL1Loss=0.0632 + throughput/total_tokens=403,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2101/500000] + train/ActionL1Loss=0.0739 + throughput/total_tokens=403,392,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2102/500000] + train/ActionL1Loss=0.0733 + throughput/total_tokens=403,584,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2103/500000] + train/ActionL1Loss=0.0714 + throughput/total_tokens=403,776,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2104/500000] + train/ActionL1Loss=0.0777 + throughput/total_tokens=403,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2105/500000] + train/ActionL1Loss=0.0682 + throughput/total_tokens=404,160,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2106/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=404,352,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2107/500000] + train/ActionL1Loss=0.0735 + throughput/total_tokens=404,544,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2108/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=404,736,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2109/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=404,928,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2110/500000] + train/ActionL1Loss=0.0742 + throughput/total_tokens=405,120,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=2111/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=405,312,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2112/500000] + train/ActionL1Loss=0.0844 + throughput/total_tokens=405,504,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2113/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=405,696,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2114/500000] + train/ActionL1Loss=0.0820 + throughput/total_tokens=405,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2115/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=406,080,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2116/500000] + train/ActionL1Loss=0.0907 + throughput/total_tokens=406,272,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2117/500000] + train/ActionL1Loss=0.0881 + throughput/total_tokens=406,464,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2118/500000] + train/ActionL1Loss=0.0789 + throughput/total_tokens=406,656,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2119/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=406,848,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2120/500000] + optim/total_grad_norm=9.379 + train/ActionL1Loss=0.0757 + throughput/total_tokens=407,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2121/500000] + train/ActionL1Loss=0.0759 + throughput/total_tokens=407,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2122/500000] + train/ActionL1Loss=0.0708 + throughput/total_tokens=407,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2123/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=407,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2124/500000] + train/ActionL1Loss=0.0802 + throughput/total_tokens=407,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2125/500000] + train/ActionL1Loss=0.0797 + throughput/total_tokens=408,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2126/500000] + train/ActionL1Loss=0.0828 + throughput/total_tokens=408,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2127/500000] + train/ActionL1Loss=0.0767 + throughput/total_tokens=408,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2128/500000] + train/ActionL1Loss=0.0761 + throughput/total_tokens=408,576,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2129/500000] + train/ActionL1Loss=0.0849 + throughput/total_tokens=408,768,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2130/500000] + train/ActionL1Loss=0.0725 + throughput/total_tokens=408,960,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2131/500000] + train/ActionL1Loss=0.0716 + throughput/total_tokens=409,152,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2132/500000] + train/ActionL1Loss=0.0706 + throughput/total_tokens=409,344,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2133/500000] + train/ActionL1Loss=0.0719 + throughput/total_tokens=409,536,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2134/500000] + train/ActionL1Loss=0.0899 + throughput/total_tokens=409,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2135/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=409,920,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2136/500000] + train/ActionL1Loss=0.0947 + throughput/total_tokens=410,112,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2137/500000] + train/ActionL1Loss=0.0836 + throughput/total_tokens=410,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2138/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=410,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2139/500000] + train/ActionL1Loss=0.0714 + throughput/total_tokens=410,688,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2140/500000] + optim/total_grad_norm=11.01 + train/ActionL1Loss=0.0752 + throughput/total_tokens=410,880,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2141/500000] + train/ActionL1Loss=0.0739 + throughput/total_tokens=411,072,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2142/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=411,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2143/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=411,456,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2144/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=411,648,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2145/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=411,840,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2146/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=412,032,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2147/500000] + train/ActionL1Loss=0.0936 + throughput/total_tokens=412,224,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2148/500000] + train/ActionL1Loss=0.0765 + throughput/total_tokens=412,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2149/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=412,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2150/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=412,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2151/500000] + train/ActionL1Loss=0.0854 + throughput/total_tokens=412,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2152/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=413,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2153/500000] + train/ActionL1Loss=0.0801 + throughput/total_tokens=413,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2154/500000] + train/ActionL1Loss=0.0787 + throughput/total_tokens=413,568,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2155/500000] + train/ActionL1Loss=0.0851 + throughput/total_tokens=413,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2156/500000] + train/ActionL1Loss=0.0815 + throughput/total_tokens=413,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2157/500000] + train/ActionL1Loss=0.0729 + throughput/total_tokens=414,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2158/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=414,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2159/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=414,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2160/500000] + optim/total_grad_norm=8.127 + train/ActionL1Loss=0.0799 + throughput/total_tokens=414,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2161/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=414,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2162/500000] + train/ActionL1Loss=0.0781 + throughput/total_tokens=415,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2163/500000] + train/ActionL1Loss=0.0831 + throughput/total_tokens=415,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2164/500000] + train/ActionL1Loss=0.0752 + throughput/total_tokens=415,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2165/500000] + train/ActionL1Loss=0.0653 + throughput/total_tokens=415,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2166/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=415,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2167/500000] + train/ActionL1Loss=0.0777 + throughput/total_tokens=416,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2168/500000] + train/ActionL1Loss=0.0784 + throughput/total_tokens=416,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2169/500000] + train/ActionL1Loss=0.0754 + throughput/total_tokens=416,448,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2170/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=416,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2171/500000] + train/ActionL1Loss=0.0779 + throughput/total_tokens=416,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2172/500000] + train/ActionL1Loss=0.0746 + throughput/total_tokens=417,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2173/500000] + train/ActionL1Loss=0.0660 + throughput/total_tokens=417,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2174/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=417,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2175/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=417,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2176/500000] + train/ActionL1Loss=0.0909 + throughput/total_tokens=417,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2177/500000] + train/ActionL1Loss=0.0762 + throughput/total_tokens=417,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2178/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=418,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2179/500000] + train/ActionL1Loss=0.0741 + throughput/total_tokens=418,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2180/500000] + optim/total_grad_norm=10.11 + train/ActionL1Loss=0.0869 + throughput/total_tokens=418,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2181/500000] + train/ActionL1Loss=0.0918 + throughput/total_tokens=418,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2182/500000] + train/ActionL1Loss=0.0880 + throughput/total_tokens=418,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2183/500000] + train/ActionL1Loss=0.0873 + throughput/total_tokens=419,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2184/500000] + train/ActionL1Loss=0.0816 + throughput/total_tokens=419,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2185/500000] + train/ActionL1Loss=0.0755 + throughput/total_tokens=419,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2186/500000] + train/ActionL1Loss=0.0762 + throughput/total_tokens=419,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2187/500000] + train/ActionL1Loss=0.0805 + throughput/total_tokens=419,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2188/500000] + train/ActionL1Loss=0.0796 + throughput/total_tokens=420,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2189/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=420,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2190/500000] + train/ActionL1Loss=0.0874 + throughput/total_tokens=420,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2191/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=420,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2192/500000] + train/ActionL1Loss=0.0833 + throughput/total_tokens=420,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2193/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=421,056,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2194/500000] + train/ActionL1Loss=0.0812 + throughput/total_tokens=421,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2195/500000] + train/ActionL1Loss=0.0678 + throughput/total_tokens=421,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2196/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=421,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2197/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=421,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2198/500000] + train/ActionL1Loss=0.0790 + throughput/total_tokens=422,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2199/500000] + train/ActionL1Loss=0.0879 + throughput/total_tokens=422,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2200/500000] + optim/total_grad_norm=10.85 + train/ActionL1Loss=0.0858 + throughput/total_tokens=422,400,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2201/500000] + train/ActionL1Loss=0.0884 + throughput/total_tokens=422,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2202/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=422,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2203/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=422,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2204/500000] + train/ActionL1Loss=0.0763 + throughput/total_tokens=423,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2205/500000] + train/ActionL1Loss=0.0867 + throughput/total_tokens=423,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2206/500000] + train/ActionL1Loss=0.0855 + throughput/total_tokens=423,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2207/500000] + train/ActionL1Loss=0.0910 + throughput/total_tokens=423,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2208/500000] + train/ActionL1Loss=0.0781 + throughput/total_tokens=423,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2209/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=424,128,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2210/500000] + train/ActionL1Loss=0.0727 + throughput/total_tokens=424,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2211/500000] + train/ActionL1Loss=0.0796 + throughput/total_tokens=424,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2212/500000] + train/ActionL1Loss=0.0734 + throughput/total_tokens=424,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2213/500000] + train/ActionL1Loss=0.0682 + throughput/total_tokens=424,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2214/500000] + train/ActionL1Loss=0.0671 + throughput/total_tokens=425,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2215/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=425,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2216/500000] + train/ActionL1Loss=0.0740 + throughput/total_tokens=425,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2217/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=425,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2218/500000] + train/ActionL1Loss=0.0740 + throughput/total_tokens=425,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2219/500000] + train/ActionL1Loss=0.0689 + throughput/total_tokens=426,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2220/500000] + optim/total_grad_norm=9.050 + train/ActionL1Loss=0.0746 + throughput/total_tokens=426,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2221/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=426,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2222/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=426,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2223/500000] + train/ActionL1Loss=0.0785 + throughput/total_tokens=426,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2224/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=427,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2225/500000] + train/ActionL1Loss=0.0756 + throughput/total_tokens=427,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2226/500000] + train/ActionL1Loss=0.0704 + throughput/total_tokens=427,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2227/500000] + train/ActionL1Loss=0.0857 + throughput/total_tokens=427,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2228/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=427,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2229/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=427,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2230/500000] + train/ActionL1Loss=0.0621 + throughput/total_tokens=428,160,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2231/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=428,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2232/500000] + train/ActionL1Loss=0.0747 + throughput/total_tokens=428,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2233/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=428,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2234/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=428,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2235/500000] + train/ActionL1Loss=0.0736 + throughput/total_tokens=429,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2236/500000] + train/ActionL1Loss=0.0751 + throughput/total_tokens=429,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2237/500000] + train/ActionL1Loss=0.0755 + throughput/total_tokens=429,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2238/500000] + train/ActionL1Loss=0.0764 + throughput/total_tokens=429,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2239/500000] + train/ActionL1Loss=0.0952 + throughput/total_tokens=429,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2240/500000] + optim/total_grad_norm=9.390 + train/ActionL1Loss=0.0771 + throughput/total_tokens=430,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2241/500000] + train/ActionL1Loss=0.0730 + throughput/total_tokens=430,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2242/500000] + train/ActionL1Loss=0.0955 + throughput/total_tokens=430,464,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2243/500000] + train/ActionL1Loss=0.0794 + throughput/total_tokens=430,656,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2244/500000] + train/ActionL1Loss=0.0679 + throughput/total_tokens=430,848,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2245/500000] + train/ActionL1Loss=0.0739 + throughput/total_tokens=431,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2246/500000] + train/ActionL1Loss=0.0681 + throughput/total_tokens=431,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2247/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=431,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2248/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=431,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2249/500000] + train/ActionL1Loss=0.0740 + throughput/total_tokens=431,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2250/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=432,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2251/500000] + train/ActionL1Loss=0.0678 + throughput/total_tokens=432,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2252/500000] + train/ActionL1Loss=0.0835 + throughput/total_tokens=432,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2253/500000] + train/ActionL1Loss=0.0949 + throughput/total_tokens=432,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2254/500000] + train/ActionL1Loss=0.0807 + throughput/total_tokens=432,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2255/500000] + train/ActionL1Loss=0.0913 + throughput/total_tokens=432,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2256/500000] + train/ActionL1Loss=0.0920 + throughput/total_tokens=433,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2257/500000] + train/ActionL1Loss=0.0769 + throughput/total_tokens=433,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2258/500000] + train/ActionL1Loss=0.0798 + throughput/total_tokens=433,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2259/500000] + train/ActionL1Loss=0.0837 + throughput/total_tokens=433,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2260/500000] + optim/total_grad_norm=10.51 + train/ActionL1Loss=0.0819 + throughput/total_tokens=433,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2261/500000] + train/ActionL1Loss=0.0720 + throughput/total_tokens=434,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2262/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=434,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2263/500000] + train/ActionL1Loss=0.0791 + throughput/total_tokens=434,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2264/500000] + train/ActionL1Loss=0.0746 + throughput/total_tokens=434,688,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2265/500000] + train/ActionL1Loss=0.0739 + throughput/total_tokens=434,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2266/500000] + train/ActionL1Loss=0.0770 + throughput/total_tokens=435,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2267/500000] + train/ActionL1Loss=0.0717 + throughput/total_tokens=435,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2268/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=435,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2269/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=435,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2270/500000] + train/ActionL1Loss=0.0733 + throughput/total_tokens=435,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2271/500000] + train/ActionL1Loss=0.0721 + throughput/total_tokens=436,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2272/500000] + train/ActionL1Loss=0.0770 + throughput/total_tokens=436,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2273/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=436,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2274/500000] + train/ActionL1Loss=0.0761 + throughput/total_tokens=436,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2275/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=436,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2276/500000] + train/ActionL1Loss=0.0731 + throughput/total_tokens=436,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2277/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=437,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2278/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=437,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2279/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=437,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2280/500000] + optim/total_grad_norm=9.688 + train/ActionL1Loss=0.0748 + throughput/total_tokens=437,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2281/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=437,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2282/500000] + train/ActionL1Loss=0.0692 + throughput/total_tokens=438,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2283/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=438,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2284/500000] + train/ActionL1Loss=0.0621 + throughput/total_tokens=438,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2285/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=438,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2286/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=438,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2287/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=439,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2288/500000] + train/ActionL1Loss=0.0704 + throughput/total_tokens=439,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2289/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=439,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2290/500000] + train/ActionL1Loss=0.0723 + throughput/total_tokens=439,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2291/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=439,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2292/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=440,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2293/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=440,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2294/500000] + train/ActionL1Loss=0.0679 + throughput/total_tokens=440,448,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2295/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=440,640,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2296/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=440,832,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2297/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=441,024,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2298/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=441,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2299/500000] + train/ActionL1Loss=0.0724 + throughput/total_tokens=441,408,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2300/500000] + optim/total_grad_norm=10.21 + train/ActionL1Loss=0.0625 + throughput/total_tokens=441,600,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2301/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=441,792,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=2302/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=441,984,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2303/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=442,176,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2304/500000] + train/ActionL1Loss=0.0747 + throughput/total_tokens=442,368,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2305/500000] + train/ActionL1Loss=0.0769 + throughput/total_tokens=442,560,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2306/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=442,752,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2307/500000] + train/ActionL1Loss=0.0854 + throughput/total_tokens=442,944,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2308/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=443,136,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2309/500000] + train/ActionL1Loss=0.0654 + throughput/total_tokens=443,328,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2310/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=443,520,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=2311/500000] + train/ActionL1Loss=0.0723 + throughput/total_tokens=443,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2312/500000] + train/ActionL1Loss=0.0896 + throughput/total_tokens=443,904,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2313/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=444,096,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2314/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=444,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2315/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=444,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2316/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=444,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2317/500000] + train/ActionL1Loss=0.0763 + throughput/total_tokens=444,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2318/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=445,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2319/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=445,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2320/500000] + optim/total_grad_norm=8.484 + train/ActionL1Loss=0.0671 + throughput/total_tokens=445,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2321/500000] + train/ActionL1Loss=0.0896 + throughput/total_tokens=445,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2322/500000] + train/ActionL1Loss=0.0716 + throughput/total_tokens=445,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2323/500000] + train/ActionL1Loss=0.0696 + throughput/total_tokens=446,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2324/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=446,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2325/500000] + train/ActionL1Loss=0.0808 + throughput/total_tokens=446,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2326/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=446,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2327/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=446,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2328/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=446,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2329/500000] + train/ActionL1Loss=0.0705 + throughput/total_tokens=447,168,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2330/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=447,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2331/500000] + train/ActionL1Loss=0.0711 + throughput/total_tokens=447,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2332/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=447,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2333/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=447,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2334/500000] + train/ActionL1Loss=0.0687 + throughput/total_tokens=448,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2335/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=448,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2336/500000] + train/ActionL1Loss=0.0918 + throughput/total_tokens=448,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2337/500000] + train/ActionL1Loss=0.0868 + throughput/total_tokens=448,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2338/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=448,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2339/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=449,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2340/500000] + optim/total_grad_norm=8.218 + train/ActionL1Loss=0.0664 + throughput/total_tokens=449,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2341/500000] + train/ActionL1Loss=0.0706 + throughput/total_tokens=449,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2342/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=449,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2343/500000] + train/ActionL1Loss=0.0723 + throughput/total_tokens=449,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2344/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=450,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2345/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=450,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2346/500000] + train/ActionL1Loss=0.0671 + throughput/total_tokens=450,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2347/500000] + train/ActionL1Loss=0.0778 + throughput/total_tokens=450,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2348/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=450,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2349/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=451,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2350/500000] + train/ActionL1Loss=0.0887 + throughput/total_tokens=451,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2351/500000] + train/ActionL1Loss=0.0728 + throughput/total_tokens=451,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2352/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=451,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2353/500000] + train/ActionL1Loss=0.0905 + throughput/total_tokens=451,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2354/500000] + train/ActionL1Loss=0.0865 + throughput/total_tokens=451,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2355/500000] + train/ActionL1Loss=0.0735 + throughput/total_tokens=452,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2356/500000] + train/ActionL1Loss=0.0819 + throughput/total_tokens=452,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2357/500000] + train/ActionL1Loss=0.0746 + throughput/total_tokens=452,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2358/500000] + train/ActionL1Loss=0.0660 + throughput/total_tokens=452,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2359/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=452,928,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2360/500000] + optim/total_grad_norm=11.03 + train/ActionL1Loss=0.0543 + throughput/total_tokens=453,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2361/500000] + train/ActionL1Loss=0.0702 + throughput/total_tokens=453,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2362/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=453,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2363/500000] + train/ActionL1Loss=0.0765 + throughput/total_tokens=453,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2364/500000] + train/ActionL1Loss=0.0814 + throughput/total_tokens=453,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2365/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=454,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2366/500000] + train/ActionL1Loss=0.0773 + throughput/total_tokens=454,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2367/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=454,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2368/500000] + train/ActionL1Loss=0.0724 + throughput/total_tokens=454,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2369/500000] + train/ActionL1Loss=0.0678 + throughput/total_tokens=454,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2370/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=455,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2371/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=455,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2372/500000] + train/ActionL1Loss=0.0889 + throughput/total_tokens=455,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2373/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=455,616,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2374/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=455,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2375/500000] + train/ActionL1Loss=0.0773 + throughput/total_tokens=456,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2376/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=456,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2377/500000] + train/ActionL1Loss=0.0773 + throughput/total_tokens=456,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2378/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=456,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2379/500000] + train/ActionL1Loss=0.0682 + throughput/total_tokens=456,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2380/500000] + optim/total_grad_norm=10.23 + train/ActionL1Loss=0.0847 + throughput/total_tokens=456,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2381/500000] + train/ActionL1Loss=0.0825 + throughput/total_tokens=457,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2382/500000] + train/ActionL1Loss=0.0792 + throughput/total_tokens=457,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2383/500000] + train/ActionL1Loss=0.0789 + throughput/total_tokens=457,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2384/500000] + train/ActionL1Loss=0.0946 + throughput/total_tokens=457,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2385/500000] + train/ActionL1Loss=0.0778 + throughput/total_tokens=457,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2386/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=458,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2387/500000] + train/ActionL1Loss=0.0870 + throughput/total_tokens=458,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2388/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=458,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2389/500000] + train/ActionL1Loss=0.0905 + throughput/total_tokens=458,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2390/500000] + train/ActionL1Loss=0.0724 + throughput/total_tokens=458,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2391/500000] + train/ActionL1Loss=0.0784 + throughput/total_tokens=459,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2392/500000] + train/ActionL1Loss=0.0796 + throughput/total_tokens=459,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2393/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=459,456,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2394/500000] + train/ActionL1Loss=0.0680 + throughput/total_tokens=459,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2395/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=459,840,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2396/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=460,032,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2397/500000] + train/ActionL1Loss=0.0864 + throughput/total_tokens=460,224,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2398/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=460,416,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2399/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=460,608,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2400/500000] + optim/total_grad_norm=9.316 + train/ActionL1Loss=0.0566 + throughput/total_tokens=460,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2401/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=460,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2402/500000] + train/ActionL1Loss=0.0717 + throughput/total_tokens=461,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2403/500000] + train/ActionL1Loss=0.0774 + throughput/total_tokens=461,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2404/500000] + train/ActionL1Loss=0.0761 + throughput/total_tokens=461,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2405/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=461,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2406/500000] + train/ActionL1Loss=0.0742 + throughput/total_tokens=461,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2407/500000] + train/ActionL1Loss=0.0788 + throughput/total_tokens=462,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2408/500000] + train/ActionL1Loss=0.0712 + throughput/total_tokens=462,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2409/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=462,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2410/500000] + train/ActionL1Loss=0.0719 + throughput/total_tokens=462,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2411/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=462,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2412/500000] + train/ActionL1Loss=0.0723 + throughput/total_tokens=463,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2413/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=463,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2414/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=463,488,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2415/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=463,680,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2416/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=463,872,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2417/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=464,064,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2418/500000] + train/ActionL1Loss=0.0811 + throughput/total_tokens=464,256,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2419/500000] + train/ActionL1Loss=0.0758 + throughput/total_tokens=464,448,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2420/500000] + optim/total_grad_norm=7.690 + train/ActionL1Loss=0.0551 + throughput/total_tokens=464,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2421/500000] + train/ActionL1Loss=0.0725 + throughput/total_tokens=464,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2422/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=465,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2423/500000] + train/ActionL1Loss=0.0692 + throughput/total_tokens=465,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2424/500000] + train/ActionL1Loss=0.0719 + throughput/total_tokens=465,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2425/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=465,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2426/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=465,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2427/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=465,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2428/500000] + train/ActionL1Loss=0.0702 + throughput/total_tokens=466,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2429/500000] + train/ActionL1Loss=0.0795 + throughput/total_tokens=466,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2430/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=466,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2431/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=466,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2432/500000] + train/ActionL1Loss=0.0820 + throughput/total_tokens=466,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2433/500000] + train/ActionL1Loss=0.0905 + throughput/total_tokens=467,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2434/500000] + train/ActionL1Loss=0.0795 + throughput/total_tokens=467,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2435/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=467,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2436/500000] + train/ActionL1Loss=0.0781 + throughput/total_tokens=467,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2437/500000] + train/ActionL1Loss=0.0777 + throughput/total_tokens=467,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2438/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=468,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2439/500000] + train/ActionL1Loss=0.0758 + throughput/total_tokens=468,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2440/500000] + optim/total_grad_norm=9.484 + train/ActionL1Loss=0.0831 + throughput/total_tokens=468,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2441/500000] + train/ActionL1Loss=0.0793 + throughput/total_tokens=468,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2442/500000] + train/ActionL1Loss=0.0841 + throughput/total_tokens=468,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2443/500000] + train/ActionL1Loss=0.0801 + throughput/total_tokens=469,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2444/500000] + train/ActionL1Loss=0.0752 + throughput/total_tokens=469,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2445/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=469,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2446/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=469,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2447/500000] + train/ActionL1Loss=0.0821 + throughput/total_tokens=469,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2448/500000] + train/ActionL1Loss=0.0827 + throughput/total_tokens=470,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2449/500000] + train/ActionL1Loss=0.0837 + throughput/total_tokens=470,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2450/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=470,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2451/500000] + train/ActionL1Loss=0.0804 + throughput/total_tokens=470,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2452/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=470,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2453/500000] + train/ActionL1Loss=0.0732 + throughput/total_tokens=470,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2454/500000] + train/ActionL1Loss=0.0756 + throughput/total_tokens=471,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2455/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=471,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2456/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=471,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2457/500000] + train/ActionL1Loss=0.0676 + throughput/total_tokens=471,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2458/500000] + train/ActionL1Loss=0.1015 + throughput/total_tokens=471,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2459/500000] + train/ActionL1Loss=0.0802 + throughput/total_tokens=472,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2460/500000] + optim/total_grad_norm=7.506 + train/ActionL1Loss=0.0717 + throughput/total_tokens=472,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2461/500000] + train/ActionL1Loss=0.0680 + throughput/total_tokens=472,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2462/500000] + train/ActionL1Loss=0.0765 + throughput/total_tokens=472,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2463/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=472,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2464/500000] + train/ActionL1Loss=0.0928 + throughput/total_tokens=473,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2465/500000] + train/ActionL1Loss=0.0815 + throughput/total_tokens=473,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2466/500000] + train/ActionL1Loss=0.0795 + throughput/total_tokens=473,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2467/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=473,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2468/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=473,856,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2469/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=474,048,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2470/500000] + train/ActionL1Loss=0.0659 + throughput/total_tokens=474,240,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2471/500000] + train/ActionL1Loss=0.0724 + throughput/total_tokens=474,432,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2472/500000] + train/ActionL1Loss=0.0755 + throughput/total_tokens=474,624,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2473/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=474,816,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2474/500000] + train/ActionL1Loss=0.0754 + throughput/total_tokens=475,008,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2475/500000] + train/ActionL1Loss=0.0735 + throughput/total_tokens=475,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2476/500000] + train/ActionL1Loss=0.0735 + throughput/total_tokens=475,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2477/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=475,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2478/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=475,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2479/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=475,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2480/500000] + optim/total_grad_norm=7.363 + train/ActionL1Loss=0.0527 + throughput/total_tokens=476,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2481/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=476,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2482/500000] + train/ActionL1Loss=0.0730 + throughput/total_tokens=476,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2483/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=476,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2484/500000] + train/ActionL1Loss=0.0779 + throughput/total_tokens=476,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2485/500000] + train/ActionL1Loss=0.0805 + throughput/total_tokens=477,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2486/500000] + train/ActionL1Loss=0.0711 + throughput/total_tokens=477,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2487/500000] + train/ActionL1Loss=0.0792 + throughput/total_tokens=477,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2488/500000] + train/ActionL1Loss=0.0821 + throughput/total_tokens=477,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2489/500000] + train/ActionL1Loss=0.0862 + throughput/total_tokens=477,888,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2490/500000] + train/ActionL1Loss=0.0728 + throughput/total_tokens=478,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2491/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=478,272,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2492/500000] + train/ActionL1Loss=0.0774 + throughput/total_tokens=478,464,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2493/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=478,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2494/500000] + train/ActionL1Loss=0.0784 + throughput/total_tokens=478,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2495/500000] + train/ActionL1Loss=0.0747 + throughput/total_tokens=479,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2496/500000] + train/ActionL1Loss=0.0826 + throughput/total_tokens=479,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2497/500000] + train/ActionL1Loss=0.0754 + throughput/total_tokens=479,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2498/500000] + train/ActionL1Loss=0.0805 + throughput/total_tokens=479,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2499/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=479,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2500/500000] + optim/total_grad_norm=10.89 + train/ActionL1Loss=0.0586 + throughput/total_tokens=480,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +10/12 [07:10:42] INFO | >> Saving config... checkpoint.py:608 +10/12 [07:11:14] INFO | >> Saving model state... checkpoint.py:796 +10/12 [07:12:24] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [07:13:48] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=2501/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=480,192,000 + throughput/device/tokens_per_second=1,207 + throughput/device/batches_per_second=0.0503 +[step=2502/500000] + train/ActionL1Loss=0.0767 + throughput/total_tokens=480,384,000 + throughput/device/tokens_per_second=1,192 + throughput/device/batches_per_second=0.0497 +[step=2503/500000] + train/ActionL1Loss=0.0735 + throughput/total_tokens=480,576,000 + throughput/device/tokens_per_second=1,188 + throughput/device/batches_per_second=0.0495 +[step=2504/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=480,768,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=2505/500000] + train/ActionL1Loss=0.0678 + throughput/total_tokens=480,960,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2506/500000] + train/ActionL1Loss=0.0769 + throughput/total_tokens=481,152,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2507/500000] + train/ActionL1Loss=0.0725 + throughput/total_tokens=481,344,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2508/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=481,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2509/500000] + train/ActionL1Loss=0.0812 + throughput/total_tokens=481,728,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2510/500000] + train/ActionL1Loss=0.0726 + throughput/total_tokens=481,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2511/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=482,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2512/500000] + train/ActionL1Loss=0.0773 + throughput/total_tokens=482,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2513/500000] + train/ActionL1Loss=0.0749 + throughput/total_tokens=482,496,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2514/500000] + train/ActionL1Loss=0.0816 + throughput/total_tokens=482,688,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2515/500000] + train/ActionL1Loss=0.0706 + throughput/total_tokens=482,880,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2516/500000] + train/ActionL1Loss=0.0687 + throughput/total_tokens=483,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2517/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=483,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2518/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=483,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2519/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=483,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2520/500000] + optim/total_grad_norm=10.41 + train/ActionL1Loss=0.0777 + throughput/total_tokens=483,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2521/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=484,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2522/500000] + train/ActionL1Loss=0.0751 + throughput/total_tokens=484,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2523/500000] + train/ActionL1Loss=0.0753 + throughput/total_tokens=484,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2524/500000] + train/ActionL1Loss=0.0765 + throughput/total_tokens=484,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2525/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=484,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2526/500000] + train/ActionL1Loss=0.0756 + throughput/total_tokens=484,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2527/500000] + train/ActionL1Loss=0.0802 + throughput/total_tokens=485,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2528/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=485,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2529/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=485,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2530/500000] + train/ActionL1Loss=0.0775 + throughput/total_tokens=485,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2531/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=485,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2532/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=486,144,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2533/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=486,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2534/500000] + train/ActionL1Loss=0.0681 + throughput/total_tokens=486,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2535/500000] + train/ActionL1Loss=0.0738 + throughput/total_tokens=486,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2536/500000] + train/ActionL1Loss=0.0784 + throughput/total_tokens=486,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2537/500000] + train/ActionL1Loss=0.0709 + throughput/total_tokens=487,104,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2538/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=487,296,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2539/500000] + train/ActionL1Loss=0.0859 + throughput/total_tokens=487,488,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2540/500000] + optim/total_grad_norm=9.774 + train/ActionL1Loss=0.0606 + throughput/total_tokens=487,680,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=2541/500000] + train/ActionL1Loss=0.0718 + throughput/total_tokens=487,872,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2542/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=488,064,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2543/500000] + train/ActionL1Loss=0.0719 + throughput/total_tokens=488,256,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2544/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=488,448,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2545/500000] + train/ActionL1Loss=0.0724 + throughput/total_tokens=488,640,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2546/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=488,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2547/500000] + train/ActionL1Loss=0.0729 + throughput/total_tokens=489,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2548/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=489,216,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2549/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=489,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2550/500000] + train/ActionL1Loss=0.0739 + throughput/total_tokens=489,600,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2551/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=489,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2552/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=489,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2553/500000] + train/ActionL1Loss=0.0853 + throughput/total_tokens=490,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2554/500000] + train/ActionL1Loss=0.0748 + throughput/total_tokens=490,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2555/500000] + train/ActionL1Loss=0.0694 + throughput/total_tokens=490,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2556/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=490,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2557/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=490,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2558/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=491,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2559/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=491,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2560/500000] + optim/total_grad_norm=9.217 + train/ActionL1Loss=0.0701 + throughput/total_tokens=491,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2561/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=491,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2562/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=491,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2563/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=492,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2564/500000] + train/ActionL1Loss=0.0834 + throughput/total_tokens=492,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2565/500000] + train/ActionL1Loss=0.0737 + throughput/total_tokens=492,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2566/500000] + train/ActionL1Loss=0.0795 + throughput/total_tokens=492,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2567/500000] + train/ActionL1Loss=0.0827 + throughput/total_tokens=492,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2568/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=493,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2569/500000] + train/ActionL1Loss=0.0696 + throughput/total_tokens=493,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2570/500000] + train/ActionL1Loss=0.0647 + throughput/total_tokens=493,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2571/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=493,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2572/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=493,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2573/500000] + train/ActionL1Loss=0.0778 + throughput/total_tokens=494,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2574/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=494,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2575/500000] + train/ActionL1Loss=0.0711 + throughput/total_tokens=494,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2576/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=494,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2577/500000] + train/ActionL1Loss=0.0805 + throughput/total_tokens=494,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2578/500000] + train/ActionL1Loss=0.0737 + throughput/total_tokens=494,976,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2579/500000] + train/ActionL1Loss=0.0742 + throughput/total_tokens=495,168,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2580/500000] + optim/total_grad_norm=8.253 + train/ActionL1Loss=0.0550 + throughput/total_tokens=495,360,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2581/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=495,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2582/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=495,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2583/500000] + train/ActionL1Loss=0.0761 + throughput/total_tokens=495,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2584/500000] + train/ActionL1Loss=0.0660 + throughput/total_tokens=496,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2585/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=496,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2586/500000] + train/ActionL1Loss=0.0867 + throughput/total_tokens=496,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2587/500000] + train/ActionL1Loss=0.0761 + throughput/total_tokens=496,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2588/500000] + train/ActionL1Loss=0.0792 + throughput/total_tokens=496,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2589/500000] + train/ActionL1Loss=0.0712 + throughput/total_tokens=497,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2590/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=497,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2591/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=497,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2592/500000] + train/ActionL1Loss=0.0778 + throughput/total_tokens=497,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2593/500000] + train/ActionL1Loss=0.0728 + throughput/total_tokens=497,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2594/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=498,048,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2595/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=498,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2596/500000] + train/ActionL1Loss=0.0806 + throughput/total_tokens=498,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2597/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=498,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2598/500000] + train/ActionL1Loss=0.0702 + throughput/total_tokens=498,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2599/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=499,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2600/500000] + optim/total_grad_norm=9.056 + train/ActionL1Loss=0.0658 + throughput/total_tokens=499,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2601/500000] + train/ActionL1Loss=0.0720 + throughput/total_tokens=499,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2602/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=499,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2603/500000] + train/ActionL1Loss=0.0798 + throughput/total_tokens=499,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2604/500000] + train/ActionL1Loss=0.0805 + throughput/total_tokens=499,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2605/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=500,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2606/500000] + train/ActionL1Loss=0.0704 + throughput/total_tokens=500,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2607/500000] + train/ActionL1Loss=0.0647 + throughput/total_tokens=500,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2608/500000] + train/ActionL1Loss=0.0732 + throughput/total_tokens=500,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2609/500000] + train/ActionL1Loss=0.0720 + throughput/total_tokens=500,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2610/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=501,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2611/500000] + train/ActionL1Loss=0.0748 + throughput/total_tokens=501,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2612/500000] + train/ActionL1Loss=0.0772 + throughput/total_tokens=501,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2613/500000] + train/ActionL1Loss=0.0789 + throughput/total_tokens=501,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2614/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=501,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2615/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=502,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2616/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=502,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2617/500000] + train/ActionL1Loss=0.0809 + throughput/total_tokens=502,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2618/500000] + train/ActionL1Loss=0.0793 + throughput/total_tokens=502,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2619/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=502,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2620/500000] + optim/total_grad_norm=9.609 + train/ActionL1Loss=0.0765 + throughput/total_tokens=503,040,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2621/500000] + train/ActionL1Loss=0.0709 + throughput/total_tokens=503,232,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2622/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=503,424,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2623/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=503,616,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2624/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=503,808,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2625/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=504,000,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2626/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=504,192,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2627/500000] + train/ActionL1Loss=0.0692 + throughput/total_tokens=504,384,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2628/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=504,576,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2629/500000] + train/ActionL1Loss=0.0732 + throughput/total_tokens=504,768,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2630/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=504,960,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2631/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=505,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2632/500000] + train/ActionL1Loss=0.0786 + throughput/total_tokens=505,344,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2633/500000] + train/ActionL1Loss=0.0767 + throughput/total_tokens=505,536,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2634/500000] + train/ActionL1Loss=0.0823 + throughput/total_tokens=505,728,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2635/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=505,920,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2636/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=506,112,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2637/500000] + train/ActionL1Loss=0.0753 + throughput/total_tokens=506,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2638/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=506,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2639/500000] + train/ActionL1Loss=0.0850 + throughput/total_tokens=506,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2640/500000] + optim/total_grad_norm=9.617 + train/ActionL1Loss=0.0620 + throughput/total_tokens=506,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2641/500000] + train/ActionL1Loss=0.0696 + throughput/total_tokens=507,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2642/500000] + train/ActionL1Loss=0.0712 + throughput/total_tokens=507,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2643/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=507,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2644/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=507,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2645/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=507,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2646/500000] + train/ActionL1Loss=0.0775 + throughput/total_tokens=508,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2647/500000] + train/ActionL1Loss=0.0727 + throughput/total_tokens=508,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2648/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=508,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2649/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=508,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2650/500000] + train/ActionL1Loss=0.0700 + throughput/total_tokens=508,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2651/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=508,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2652/500000] + train/ActionL1Loss=0.0875 + throughput/total_tokens=509,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2653/500000] + train/ActionL1Loss=0.0679 + throughput/total_tokens=509,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2654/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=509,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2655/500000] + train/ActionL1Loss=0.0717 + throughput/total_tokens=509,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2656/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=509,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2657/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=510,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2658/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=510,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2659/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=510,528,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2660/500000] + optim/total_grad_norm=9.644 + train/ActionL1Loss=0.0609 + throughput/total_tokens=510,720,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=2661/500000] + train/ActionL1Loss=0.0786 + throughput/total_tokens=510,912,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2662/500000] + train/ActionL1Loss=0.0711 + throughput/total_tokens=511,104,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2663/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=511,296,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2664/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=511,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2665/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=511,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2666/500000] + train/ActionL1Loss=0.0741 + throughput/total_tokens=511,872,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2667/500000] + train/ActionL1Loss=0.0791 + throughput/total_tokens=512,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2668/500000] + train/ActionL1Loss=0.0740 + throughput/total_tokens=512,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2669/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=512,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2670/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=512,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2671/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=512,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2672/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=513,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2673/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=513,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2674/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=513,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2675/500000] + train/ActionL1Loss=0.0746 + throughput/total_tokens=513,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2676/500000] + train/ActionL1Loss=0.0745 + throughput/total_tokens=513,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2677/500000] + train/ActionL1Loss=0.0681 + throughput/total_tokens=513,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2678/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=514,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2679/500000] + train/ActionL1Loss=0.0702 + throughput/total_tokens=514,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2680/500000] + optim/total_grad_norm=10.25 + train/ActionL1Loss=0.0581 + throughput/total_tokens=514,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2681/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=514,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2682/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=514,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2683/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=515,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2684/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=515,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2685/500000] + train/ActionL1Loss=0.0736 + throughput/total_tokens=515,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2686/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=515,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2687/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=515,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2688/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=516,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2689/500000] + train/ActionL1Loss=0.0706 + throughput/total_tokens=516,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2690/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=516,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2691/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=516,672,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2692/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=516,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2693/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=517,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2694/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=517,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2695/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=517,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2696/500000] + train/ActionL1Loss=0.0679 + throughput/total_tokens=517,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2697/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=517,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2698/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=518,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2699/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=518,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2700/500000] + optim/total_grad_norm=10.55 + train/ActionL1Loss=0.0636 + throughput/total_tokens=518,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2701/500000] + train/ActionL1Loss=0.0737 + throughput/total_tokens=518,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2702/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=518,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2703/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=518,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2704/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=519,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2705/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=519,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2706/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=519,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2707/500000] + train/ActionL1Loss=0.0730 + throughput/total_tokens=519,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2708/500000] + train/ActionL1Loss=0.0854 + throughput/total_tokens=519,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2709/500000] + train/ActionL1Loss=0.0689 + throughput/total_tokens=520,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2710/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=520,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2711/500000] + train/ActionL1Loss=0.0816 + throughput/total_tokens=520,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2712/500000] + train/ActionL1Loss=0.0729 + throughput/total_tokens=520,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2713/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=520,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2714/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=521,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2715/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=521,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2716/500000] + train/ActionL1Loss=0.0695 + throughput/total_tokens=521,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2717/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=521,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2718/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=521,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2719/500000] + train/ActionL1Loss=0.0779 + throughput/total_tokens=522,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2720/500000] + optim/total_grad_norm=9.741 + train/ActionL1Loss=0.0664 + throughput/total_tokens=522,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2721/500000] + train/ActionL1Loss=0.0706 + throughput/total_tokens=522,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2722/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=522,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2723/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=522,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2724/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=523,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2725/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=523,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2726/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=523,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2727/500000] + train/ActionL1Loss=0.0747 + throughput/total_tokens=523,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2728/500000] + train/ActionL1Loss=0.0705 + throughput/total_tokens=523,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2729/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=523,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2730/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=524,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2731/500000] + train/ActionL1Loss=0.0678 + throughput/total_tokens=524,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2732/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=524,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2733/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=524,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2734/500000] + train/ActionL1Loss=0.0732 + throughput/total_tokens=524,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2735/500000] + train/ActionL1Loss=0.0786 + throughput/total_tokens=525,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2736/500000] + train/ActionL1Loss=0.0875 + throughput/total_tokens=525,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2737/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=525,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2738/500000] + train/ActionL1Loss=0.0808 + throughput/total_tokens=525,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2739/500000] + train/ActionL1Loss=0.0777 + throughput/total_tokens=525,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2740/500000] + optim/total_grad_norm=8.627 + train/ActionL1Loss=0.0718 + throughput/total_tokens=526,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2741/500000] + train/ActionL1Loss=0.0738 + throughput/total_tokens=526,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2742/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=526,464,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2743/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=526,656,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2744/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=526,848,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2745/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=527,040,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2746/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=527,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2747/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=527,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2748/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=527,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2749/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=527,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2750/500000] + train/ActionL1Loss=0.0753 + throughput/total_tokens=528,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2751/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=528,192,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2752/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=528,384,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2753/500000] + train/ActionL1Loss=0.0721 + throughput/total_tokens=528,576,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=2754/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=528,768,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2755/500000] + train/ActionL1Loss=0.0810 + throughput/total_tokens=528,960,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2756/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=529,152,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2757/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=529,344,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2758/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=529,536,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2759/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=529,728,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2760/500000] + optim/total_grad_norm=9.747 + train/ActionL1Loss=0.0580 + throughput/total_tokens=529,920,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=2761/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=530,112,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=2762/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=530,304,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2763/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=530,496,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2764/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=530,688,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=2765/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=530,880,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=2766/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=531,072,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2767/500000] + train/ActionL1Loss=0.0814 + throughput/total_tokens=531,264,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2768/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=531,456,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2769/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=531,648,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=2770/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=531,840,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2771/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=532,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2772/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=532,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2773/500000] + train/ActionL1Loss=0.0747 + throughput/total_tokens=532,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2774/500000] + train/ActionL1Loss=0.0695 + throughput/total_tokens=532,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2775/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=532,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2776/500000] + train/ActionL1Loss=0.0812 + throughput/total_tokens=532,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2777/500000] + train/ActionL1Loss=0.0832 + throughput/total_tokens=533,184,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2778/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=533,376,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2779/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=533,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2780/500000] + optim/total_grad_norm=10.71 + train/ActionL1Loss=0.0644 + throughput/total_tokens=533,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2781/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=533,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2782/500000] + train/ActionL1Loss=0.0653 + throughput/total_tokens=534,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2783/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=534,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2784/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=534,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2785/500000] + train/ActionL1Loss=0.0738 + throughput/total_tokens=534,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2786/500000] + train/ActionL1Loss=0.0739 + throughput/total_tokens=534,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2787/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=535,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2788/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=535,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2789/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=535,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2790/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=535,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2791/500000] + train/ActionL1Loss=0.0723 + throughput/total_tokens=535,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2792/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=536,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2793/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=536,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2794/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=536,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2795/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=536,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2796/500000] + train/ActionL1Loss=0.0776 + throughput/total_tokens=536,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2797/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=537,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2798/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=537,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2799/500000] + train/ActionL1Loss=0.0642 + throughput/total_tokens=537,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2800/500000] + optim/total_grad_norm=7.757 + train/ActionL1Loss=0.0593 + throughput/total_tokens=537,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2801/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=537,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2802/500000] + train/ActionL1Loss=0.0753 + throughput/total_tokens=537,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2803/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=538,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2804/500000] + train/ActionL1Loss=0.0740 + throughput/total_tokens=538,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2805/500000] + train/ActionL1Loss=0.0798 + throughput/total_tokens=538,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2806/500000] + train/ActionL1Loss=0.0711 + throughput/total_tokens=538,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2807/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=538,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2808/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=539,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2809/500000] + train/ActionL1Loss=0.0825 + throughput/total_tokens=539,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2810/500000] + train/ActionL1Loss=0.0789 + throughput/total_tokens=539,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2811/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=539,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2812/500000] + train/ActionL1Loss=0.0783 + throughput/total_tokens=539,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2813/500000] + train/ActionL1Loss=0.0843 + throughput/total_tokens=540,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2814/500000] + train/ActionL1Loss=0.0659 + throughput/total_tokens=540,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2815/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=540,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2816/500000] + train/ActionL1Loss=0.0889 + throughput/total_tokens=540,672,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2817/500000] + train/ActionL1Loss=0.0813 + throughput/total_tokens=540,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2818/500000] + train/ActionL1Loss=0.0749 + throughput/total_tokens=541,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2819/500000] + train/ActionL1Loss=0.0819 + throughput/total_tokens=541,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2820/500000] + optim/total_grad_norm=10.87 + train/ActionL1Loss=0.0623 + throughput/total_tokens=541,440,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=2821/500000] + train/ActionL1Loss=0.0781 + throughput/total_tokens=541,632,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2822/500000] + train/ActionL1Loss=0.0842 + throughput/total_tokens=541,824,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2823/500000] + train/ActionL1Loss=0.0784 + throughput/total_tokens=542,016,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2824/500000] + train/ActionL1Loss=0.0684 + throughput/total_tokens=542,208,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2825/500000] + train/ActionL1Loss=0.0815 + throughput/total_tokens=542,400,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2826/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=542,592,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2827/500000] + train/ActionL1Loss=0.0756 + throughput/total_tokens=542,784,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2828/500000] + train/ActionL1Loss=0.0801 + throughput/total_tokens=542,976,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2829/500000] + train/ActionL1Loss=0.0754 + throughput/total_tokens=543,168,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2830/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=543,360,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=2831/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=543,552,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2832/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=543,744,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2833/500000] + train/ActionL1Loss=0.0831 + throughput/total_tokens=543,936,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2834/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=544,128,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2835/500000] + train/ActionL1Loss=0.0720 + throughput/total_tokens=544,320,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2836/500000] + train/ActionL1Loss=0.0868 + throughput/total_tokens=544,512,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=2837/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=544,704,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=2838/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=544,896,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2839/500000] + train/ActionL1Loss=0.0659 + throughput/total_tokens=545,088,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=2840/500000] + optim/total_grad_norm=8.631 + train/ActionL1Loss=0.0678 + throughput/total_tokens=545,280,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=2841/500000] + train/ActionL1Loss=0.0689 + throughput/total_tokens=545,472,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2842/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=545,664,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2843/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=545,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2844/500000] + train/ActionL1Loss=0.0869 + throughput/total_tokens=546,048,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2845/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=546,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2846/500000] + train/ActionL1Loss=0.0841 + throughput/total_tokens=546,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2847/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=546,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2848/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=546,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2849/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=547,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2850/500000] + train/ActionL1Loss=0.0681 + throughput/total_tokens=547,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2851/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=547,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2852/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=547,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2853/500000] + train/ActionL1Loss=0.0900 + throughput/total_tokens=547,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2854/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=547,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2855/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=548,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2856/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=548,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2857/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=548,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2858/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=548,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2859/500000] + train/ActionL1Loss=0.0800 + throughput/total_tokens=548,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2860/500000] + optim/total_grad_norm=9.832 + train/ActionL1Loss=0.0612 + throughput/total_tokens=549,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2861/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=549,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2862/500000] + train/ActionL1Loss=0.0694 + throughput/total_tokens=549,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2863/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=549,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2864/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=549,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2865/500000] + train/ActionL1Loss=0.0660 + throughput/total_tokens=550,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2866/500000] + train/ActionL1Loss=0.0708 + throughput/total_tokens=550,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2867/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=550,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2868/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=550,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2869/500000] + train/ActionL1Loss=0.0748 + throughput/total_tokens=550,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2870/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=551,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2871/500000] + train/ActionL1Loss=0.0844 + throughput/total_tokens=551,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2872/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=551,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2873/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=551,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2874/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=551,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2875/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=552,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2876/500000] + train/ActionL1Loss=0.0764 + throughput/total_tokens=552,192,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2877/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=552,384,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2878/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=552,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2879/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=552,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2880/500000] + optim/total_grad_norm=9.555 + train/ActionL1Loss=0.0706 + throughput/total_tokens=552,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2881/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=553,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2882/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=553,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2883/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=553,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2884/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=553,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2885/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=553,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2886/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=554,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2887/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=554,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2888/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=554,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2889/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=554,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2890/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=554,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2891/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=555,072,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2892/500000] + train/ActionL1Loss=0.0653 + throughput/total_tokens=555,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2893/500000] + train/ActionL1Loss=0.0751 + throughput/total_tokens=555,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2894/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=555,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2895/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=555,840,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2896/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=556,032,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2897/500000] + train/ActionL1Loss=0.0787 + throughput/total_tokens=556,224,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2898/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=556,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2899/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=556,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2900/500000] + optim/total_grad_norm=8.648 + train/ActionL1Loss=0.0672 + throughput/total_tokens=556,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2901/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=556,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=2902/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=557,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2903/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=557,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=2904/500000] + train/ActionL1Loss=0.0712 + throughput/total_tokens=557,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2905/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=557,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2906/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=557,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2907/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=558,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2908/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=558,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2909/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=558,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2910/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=558,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2911/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=558,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2912/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=559,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2913/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=559,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2914/500000] + train/ActionL1Loss=0.0777 + throughput/total_tokens=559,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2915/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=559,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2916/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=559,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2917/500000] + train/ActionL1Loss=0.0963 + throughput/total_tokens=560,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2918/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=560,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2919/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=560,448,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2920/500000] + optim/total_grad_norm=8.920 + train/ActionL1Loss=0.0657 + throughput/total_tokens=560,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2921/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=560,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2922/500000] + train/ActionL1Loss=0.0735 + throughput/total_tokens=561,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2923/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=561,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2924/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=561,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2925/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=561,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2926/500000] + train/ActionL1Loss=0.0733 + throughput/total_tokens=561,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2927/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=561,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2928/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=562,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2929/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=562,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2930/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=562,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2931/500000] + train/ActionL1Loss=0.0736 + throughput/total_tokens=562,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2932/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=562,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2933/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=563,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2934/500000] + train/ActionL1Loss=0.0812 + throughput/total_tokens=563,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2935/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=563,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2936/500000] + train/ActionL1Loss=0.0769 + throughput/total_tokens=563,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2937/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=563,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2938/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=564,096,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2939/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=564,288,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2940/500000] + optim/total_grad_norm=9.026 + train/ActionL1Loss=0.0696 + throughput/total_tokens=564,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2941/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=564,672,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2942/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=564,864,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2943/500000] + train/ActionL1Loss=0.0749 + throughput/total_tokens=565,056,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2944/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=565,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2945/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=565,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2946/500000] + train/ActionL1Loss=0.0829 + throughput/total_tokens=565,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2947/500000] + train/ActionL1Loss=0.0727 + throughput/total_tokens=565,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=2948/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=566,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2949/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=566,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2950/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=566,400,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2951/500000] + train/ActionL1Loss=0.0680 + throughput/total_tokens=566,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2952/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=566,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=2953/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=566,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2954/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=567,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2955/500000] + train/ActionL1Loss=0.0795 + throughput/total_tokens=567,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2956/500000] + train/ActionL1Loss=0.0765 + throughput/total_tokens=567,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2957/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=567,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2958/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=567,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2959/500000] + train/ActionL1Loss=0.0741 + throughput/total_tokens=568,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2960/500000] + optim/total_grad_norm=8.936 + train/ActionL1Loss=0.0710 + throughput/total_tokens=568,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=2961/500000] + train/ActionL1Loss=0.0692 + throughput/total_tokens=568,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2962/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=568,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2963/500000] + train/ActionL1Loss=0.0745 + throughput/total_tokens=568,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2964/500000] + train/ActionL1Loss=0.0851 + throughput/total_tokens=569,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2965/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=569,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2966/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=569,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2967/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=569,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2968/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=569,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=2969/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=570,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=2970/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=570,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=2971/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=570,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=2972/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=570,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=2973/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=570,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2974/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=571,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2975/500000] + train/ActionL1Loss=0.0702 + throughput/total_tokens=571,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2976/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=571,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2977/500000] + train/ActionL1Loss=0.0732 + throughput/total_tokens=571,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2978/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=571,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2979/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=571,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=2980/500000] + optim/total_grad_norm=8.384 + train/ActionL1Loss=0.0806 + throughput/total_tokens=572,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2981/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=572,352,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2982/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=572,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2983/500000] + train/ActionL1Loss=0.0716 + throughput/total_tokens=572,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2984/500000] + train/ActionL1Loss=0.0769 + throughput/total_tokens=572,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2985/500000] + train/ActionL1Loss=0.0717 + throughput/total_tokens=573,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2986/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=573,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2987/500000] + train/ActionL1Loss=0.0694 + throughput/total_tokens=573,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2988/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=573,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2989/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=573,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2990/500000] + train/ActionL1Loss=0.0696 + throughput/total_tokens=574,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=2991/500000] + train/ActionL1Loss=0.0728 + throughput/total_tokens=574,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2992/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=574,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2993/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=574,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2994/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=574,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2995/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=575,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2996/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=575,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2997/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=575,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2998/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=575,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=2999/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=575,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3000/500000] + optim/total_grad_norm=9.807 + train/ActionL1Loss=0.0804 + throughput/total_tokens=576,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/12 [10:04:47] INFO | >> Saving config... checkpoint.py:608 +10/12 [10:05:31] INFO | >> Saving model state... checkpoint.py:796 +10/12 [10:06:41] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [10:08:12] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=3001/500000] + train/ActionL1Loss=0.0745 + throughput/total_tokens=576,192,000 + throughput/device/tokens_per_second=1,213 + throughput/device/batches_per_second=0.0506 +[step=3002/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=576,384,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0493 +[step=3003/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=576,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3004/500000] + train/ActionL1Loss=0.0712 + throughput/total_tokens=576,768,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3005/500000] + train/ActionL1Loss=0.0762 + throughput/total_tokens=576,960,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3006/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=577,152,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3007/500000] + train/ActionL1Loss=0.0779 + throughput/total_tokens=577,344,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3008/500000] + train/ActionL1Loss=0.0728 + throughput/total_tokens=577,536,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3009/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=577,728,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3010/500000] + train/ActionL1Loss=0.0773 + throughput/total_tokens=577,920,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=3011/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=578,112,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3012/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=578,304,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3013/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=578,496,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3014/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=578,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3015/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=578,880,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3016/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=579,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3017/500000] + train/ActionL1Loss=0.0785 + throughput/total_tokens=579,264,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3018/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=579,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3019/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=579,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3020/500000] + optim/total_grad_norm=8.776 + train/ActionL1Loss=0.0636 + throughput/total_tokens=579,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3021/500000] + train/ActionL1Loss=0.0792 + throughput/total_tokens=580,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3022/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=580,224,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3023/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=580,416,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3024/500000] + train/ActionL1Loss=0.0687 + throughput/total_tokens=580,608,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3025/500000] + train/ActionL1Loss=0.0705 + throughput/total_tokens=580,800,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3026/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=580,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3027/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=581,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3028/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=581,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3029/500000] + train/ActionL1Loss=0.0646 + throughput/total_tokens=581,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3030/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=581,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3031/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=581,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3032/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=582,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3033/500000] + train/ActionL1Loss=0.0734 + throughput/total_tokens=582,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3034/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=582,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3035/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=582,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3036/500000] + train/ActionL1Loss=0.0695 + throughput/total_tokens=582,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3037/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=583,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3038/500000] + train/ActionL1Loss=0.0659 + throughput/total_tokens=583,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3039/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=583,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3040/500000] + optim/total_grad_norm=7.621 + train/ActionL1Loss=0.0526 + throughput/total_tokens=583,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3041/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=583,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3042/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=584,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3043/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=584,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3044/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=584,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3045/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=584,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3046/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=584,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3047/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=585,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3048/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=585,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3049/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=585,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3050/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=585,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3051/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=585,792,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3052/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=585,984,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=3053/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=586,176,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=3054/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=586,368,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=3055/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=586,560,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=3056/500000] + train/ActionL1Loss=0.0642 + throughput/total_tokens=586,752,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=3057/500000] + train/ActionL1Loss=0.0696 + throughput/total_tokens=586,944,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=3058/500000] + train/ActionL1Loss=0.0676 + throughput/total_tokens=587,136,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=3059/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=587,328,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=3060/500000] + optim/total_grad_norm=9.469 + train/ActionL1Loss=0.0649 + throughput/total_tokens=587,520,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=3061/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=587,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3062/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=587,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3063/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=588,096,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3064/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=588,288,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3065/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=588,480,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3066/500000] + train/ActionL1Loss=0.0783 + throughput/total_tokens=588,672,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3067/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=588,864,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3068/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=589,056,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3069/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=589,248,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=3070/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=589,440,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3071/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=589,632,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3072/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=589,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3073/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=590,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3074/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=590,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3075/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=590,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3076/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=590,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3077/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=590,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3078/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=590,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3079/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=591,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3080/500000] + optim/total_grad_norm=10.01 + train/ActionL1Loss=0.0543 + throughput/total_tokens=591,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3081/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=591,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3082/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=591,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3083/500000] + train/ActionL1Loss=0.0790 + throughput/total_tokens=591,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3084/500000] + train/ActionL1Loss=0.0776 + throughput/total_tokens=592,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3085/500000] + train/ActionL1Loss=0.0854 + throughput/total_tokens=592,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3086/500000] + train/ActionL1Loss=0.0763 + throughput/total_tokens=592,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3087/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=592,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3088/500000] + train/ActionL1Loss=0.0740 + throughput/total_tokens=592,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3089/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=593,088,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3090/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=593,280,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3091/500000] + train/ActionL1Loss=0.0764 + throughput/total_tokens=593,472,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3092/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=593,664,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3093/500000] + train/ActionL1Loss=0.0814 + throughput/total_tokens=593,856,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3094/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=594,048,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3095/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=594,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3096/500000] + train/ActionL1Loss=0.0858 + throughput/total_tokens=594,432,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3097/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=594,624,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3098/500000] + train/ActionL1Loss=0.0671 + throughput/total_tokens=594,816,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3099/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=595,008,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3100/500000] + optim/total_grad_norm=10.38 + train/ActionL1Loss=0.0556 + throughput/total_tokens=595,200,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=3101/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=595,392,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3102/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=595,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3103/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=595,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3104/500000] + train/ActionL1Loss=0.0684 + throughput/total_tokens=595,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3105/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=596,160,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3106/500000] + train/ActionL1Loss=0.0748 + throughput/total_tokens=596,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3107/500000] + train/ActionL1Loss=0.0801 + throughput/total_tokens=596,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3108/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=596,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3109/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=596,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3110/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=597,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3111/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=597,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3112/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=597,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3113/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=597,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3114/500000] + train/ActionL1Loss=0.0684 + throughput/total_tokens=597,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3115/500000] + train/ActionL1Loss=0.0753 + throughput/total_tokens=598,080,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3116/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=598,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3117/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=598,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3118/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=598,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3119/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=598,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3120/500000] + optim/total_grad_norm=8.330 + train/ActionL1Loss=0.0512 + throughput/total_tokens=599,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3121/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=599,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3122/500000] + train/ActionL1Loss=0.0654 + throughput/total_tokens=599,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3123/500000] + train/ActionL1Loss=0.0716 + throughput/total_tokens=599,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3124/500000] + train/ActionL1Loss=0.0763 + throughput/total_tokens=599,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3125/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=600,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3126/500000] + train/ActionL1Loss=0.0671 + throughput/total_tokens=600,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3127/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=600,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3128/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=600,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3129/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=600,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3130/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=600,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3131/500000] + train/ActionL1Loss=0.0719 + throughput/total_tokens=601,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3132/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=601,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3133/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=601,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3134/500000] + train/ActionL1Loss=0.0785 + throughput/total_tokens=601,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3135/500000] + train/ActionL1Loss=0.0682 + throughput/total_tokens=601,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3136/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=602,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3137/500000] + train/ActionL1Loss=0.0680 + throughput/total_tokens=602,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3138/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=602,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3139/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=602,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3140/500000] + optim/total_grad_norm=9.829 + train/ActionL1Loss=0.0812 + throughput/total_tokens=602,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3141/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=603,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3142/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=603,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3143/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=603,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3144/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=603,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3145/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=603,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3146/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=604,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3147/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=604,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3148/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=604,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3149/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=604,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3150/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=604,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3151/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=604,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3152/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=605,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3153/500000] + train/ActionL1Loss=0.0723 + throughput/total_tokens=605,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3154/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=605,568,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3155/500000] + train/ActionL1Loss=0.0771 + throughput/total_tokens=605,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3156/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=605,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3157/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=606,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3158/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=606,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3159/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=606,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3160/500000] + optim/total_grad_norm=7.991 + train/ActionL1Loss=0.0664 + throughput/total_tokens=606,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3161/500000] + train/ActionL1Loss=0.0822 + throughput/total_tokens=606,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3162/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=607,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3163/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=607,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3164/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=607,488,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3165/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=607,680,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3166/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=607,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3167/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=608,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3168/500000] + train/ActionL1Loss=0.0646 + throughput/total_tokens=608,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3169/500000] + train/ActionL1Loss=0.0740 + throughput/total_tokens=608,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3170/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=608,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3171/500000] + train/ActionL1Loss=0.0702 + throughput/total_tokens=608,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3172/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=609,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3173/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=609,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3174/500000] + train/ActionL1Loss=0.0765 + throughput/total_tokens=609,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3175/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=609,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3176/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=609,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3177/500000] + train/ActionL1Loss=0.0801 + throughput/total_tokens=609,984,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3178/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=610,176,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3179/500000] + train/ActionL1Loss=0.0721 + throughput/total_tokens=610,368,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3180/500000] + optim/total_grad_norm=9.146 + train/ActionL1Loss=0.0624 + throughput/total_tokens=610,560,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3181/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=610,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3182/500000] + train/ActionL1Loss=0.0704 + throughput/total_tokens=610,944,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3183/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=611,136,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3184/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=611,328,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3185/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=611,520,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3186/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=611,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3187/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=611,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3188/500000] + train/ActionL1Loss=0.0727 + throughput/total_tokens=612,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3189/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=612,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3190/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=612,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3191/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=612,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3192/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=612,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3193/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=613,056,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3194/500000] + train/ActionL1Loss=0.0717 + throughput/total_tokens=613,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3195/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=613,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3196/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=613,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3197/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=613,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3198/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=614,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3199/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=614,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3200/500000] + optim/total_grad_norm=10.50 + train/ActionL1Loss=0.0753 + throughput/total_tokens=614,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3201/500000] + train/ActionL1Loss=0.0705 + throughput/total_tokens=614,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3202/500000] + train/ActionL1Loss=0.0654 + throughput/total_tokens=614,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3203/500000] + train/ActionL1Loss=0.0707 + throughput/total_tokens=614,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3204/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=615,168,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3205/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=615,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3206/500000] + train/ActionL1Loss=0.0763 + throughput/total_tokens=615,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3207/500000] + train/ActionL1Loss=0.0676 + throughput/total_tokens=615,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3208/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=615,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3209/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=616,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3210/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=616,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3211/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=616,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3212/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=616,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3213/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=616,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3214/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=617,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3215/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=617,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3216/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=617,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3217/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=617,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3218/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=617,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3219/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=618,048,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3220/500000] + optim/total_grad_norm=7.879 + train/ActionL1Loss=0.0671 + throughput/total_tokens=618,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3221/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=618,432,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3222/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=618,624,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3223/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=618,816,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3224/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=619,008,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3225/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=619,200,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3226/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=619,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3227/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=619,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3228/500000] + train/ActionL1Loss=0.0659 + throughput/total_tokens=619,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3229/500000] + train/ActionL1Loss=0.0770 + throughput/total_tokens=619,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3230/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=620,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3231/500000] + train/ActionL1Loss=0.0753 + throughput/total_tokens=620,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3232/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=620,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3233/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=620,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3234/500000] + train/ActionL1Loss=0.0711 + throughput/total_tokens=620,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3235/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=621,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3236/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=621,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3237/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=621,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3238/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=621,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3239/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=621,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3240/500000] + optim/total_grad_norm=9.791 + train/ActionL1Loss=0.0706 + throughput/total_tokens=622,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3241/500000] + train/ActionL1Loss=0.0821 + throughput/total_tokens=622,272,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3242/500000] + train/ActionL1Loss=0.0704 + throughput/total_tokens=622,464,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3243/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=622,656,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3244/500000] + train/ActionL1Loss=0.0745 + throughput/total_tokens=622,848,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3245/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=623,040,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3246/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=623,232,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3247/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=623,424,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3248/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=623,616,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3249/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=623,808,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3250/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=624,000,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3251/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=624,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3252/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=624,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3253/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=624,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3254/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=624,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3255/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=624,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3256/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=625,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3257/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=625,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3258/500000] + train/ActionL1Loss=0.0694 + throughput/total_tokens=625,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3259/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=625,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3260/500000] + optim/total_grad_norm=8.580 + train/ActionL1Loss=0.0720 + throughput/total_tokens=625,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3261/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=626,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3262/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=626,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3263/500000] + train/ActionL1Loss=0.0671 + throughput/total_tokens=626,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3264/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=626,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3265/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=626,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3266/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=627,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3267/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=627,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3268/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=627,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3269/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=627,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3270/500000] + train/ActionL1Loss=0.0785 + throughput/total_tokens=627,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3271/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=628,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3272/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=628,224,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3273/500000] + train/ActionL1Loss=0.0670 + throughput/total_tokens=628,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3274/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=628,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3275/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=628,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3276/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=628,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3277/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=629,184,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3278/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=629,376,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3279/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=629,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3280/500000] + optim/total_grad_norm=10.93 + train/ActionL1Loss=0.0639 + throughput/total_tokens=629,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3281/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=629,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3282/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=630,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3283/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=630,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3284/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=630,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3285/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=630,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3286/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=630,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3287/500000] + train/ActionL1Loss=0.0712 + throughput/total_tokens=631,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3288/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=631,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3289/500000] + train/ActionL1Loss=0.0762 + throughput/total_tokens=631,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3290/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=631,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3291/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=631,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3292/500000] + train/ActionL1Loss=0.0642 + throughput/total_tokens=632,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3293/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=632,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3294/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=632,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3295/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=632,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3296/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=632,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3297/500000] + train/ActionL1Loss=0.0770 + throughput/total_tokens=633,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3298/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=633,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3299/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=633,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3300/500000] + optim/total_grad_norm=10.67 + train/ActionL1Loss=0.0611 + throughput/total_tokens=633,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3301/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=633,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3302/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=633,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3303/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=634,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3304/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=634,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3305/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=634,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3306/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=634,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3307/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=634,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3308/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=635,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3309/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=635,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3310/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=635,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3311/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=635,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3312/500000] + train/ActionL1Loss=0.0717 + throughput/total_tokens=635,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3313/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=636,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3314/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=636,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3315/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=636,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3316/500000] + train/ActionL1Loss=0.0709 + throughput/total_tokens=636,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3317/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=636,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3318/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=637,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3319/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=637,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3320/500000] + optim/total_grad_norm=8.253 + train/ActionL1Loss=0.0740 + throughput/total_tokens=637,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3321/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=637,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3322/500000] + train/ActionL1Loss=0.0802 + throughput/total_tokens=637,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3323/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=638,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3324/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=638,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3325/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=638,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3326/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=638,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3327/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=638,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3328/500000] + train/ActionL1Loss=0.0647 + throughput/total_tokens=638,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3329/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=639,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3330/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=639,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3331/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=639,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3332/500000] + train/ActionL1Loss=0.0759 + throughput/total_tokens=639,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3333/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=639,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3334/500000] + train/ActionL1Loss=0.0745 + throughput/total_tokens=640,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3335/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=640,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3336/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=640,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3337/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=640,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3338/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=640,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3339/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=641,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3340/500000] + optim/total_grad_norm=9.166 + train/ActionL1Loss=0.0518 + throughput/total_tokens=641,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3341/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=641,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3342/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=641,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3343/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=641,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3344/500000] + train/ActionL1Loss=0.0712 + throughput/total_tokens=642,048,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3345/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=642,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3346/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=642,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3347/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=642,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3348/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=642,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3349/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=643,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3350/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=643,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3351/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=643,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3352/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=643,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3353/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=643,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3354/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=643,968,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=3355/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=644,160,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=3356/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=644,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3357/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=644,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3358/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=644,736,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3359/500000] + train/ActionL1Loss=0.0763 + throughput/total_tokens=644,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3360/500000] + optim/total_grad_norm=8.757 + train/ActionL1Loss=0.0762 + throughput/total_tokens=645,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3361/500000] + train/ActionL1Loss=0.0696 + throughput/total_tokens=645,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3362/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=645,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3363/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=645,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3364/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=645,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3365/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=646,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3366/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=646,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3367/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=646,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3368/500000] + train/ActionL1Loss=0.0758 + throughput/total_tokens=646,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3369/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=646,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3370/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=647,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3371/500000] + train/ActionL1Loss=0.0772 + throughput/total_tokens=647,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3372/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=647,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3373/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=647,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3374/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=647,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3375/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=648,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3376/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=648,192,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3377/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=648,384,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3378/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=648,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3379/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=648,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3380/500000] + optim/total_grad_norm=10.56 + train/ActionL1Loss=0.0556 + throughput/total_tokens=648,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3381/500000] + train/ActionL1Loss=0.0725 + throughput/total_tokens=649,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3382/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=649,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3383/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=649,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3384/500000] + train/ActionL1Loss=0.0826 + throughput/total_tokens=649,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3385/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=649,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3386/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=650,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3387/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=650,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3388/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=650,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3389/500000] + train/ActionL1Loss=0.0654 + throughput/total_tokens=650,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3390/500000] + train/ActionL1Loss=0.0872 + throughput/total_tokens=650,880,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3391/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=651,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3392/500000] + train/ActionL1Loss=0.0704 + throughput/total_tokens=651,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3393/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=651,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3394/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=651,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3395/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=651,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3396/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=652,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3397/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=652,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3398/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=652,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3399/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=652,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3400/500000] + optim/total_grad_norm=9.209 + train/ActionL1Loss=0.0647 + throughput/total_tokens=652,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3401/500000] + train/ActionL1Loss=0.0689 + throughput/total_tokens=652,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3402/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=653,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3403/500000] + train/ActionL1Loss=0.0720 + throughput/total_tokens=653,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3404/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=653,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3405/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=653,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3406/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=653,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3407/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=654,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3408/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=654,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3409/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=654,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3410/500000] + train/ActionL1Loss=0.0684 + throughput/total_tokens=654,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3411/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=654,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3412/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=655,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3413/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=655,296,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3414/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=655,488,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3415/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=655,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3416/500000] + train/ActionL1Loss=0.0785 + throughput/total_tokens=655,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3417/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=656,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3418/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=656,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3419/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=656,448,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3420/500000] + optim/total_grad_norm=9.598 + train/ActionL1Loss=0.0490 + throughput/total_tokens=656,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3421/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=656,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3422/500000] + train/ActionL1Loss=0.0784 + throughput/total_tokens=657,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3423/500000] + train/ActionL1Loss=0.0743 + throughput/total_tokens=657,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3424/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=657,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3425/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=657,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3426/500000] + train/ActionL1Loss=0.0720 + throughput/total_tokens=657,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3427/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=657,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3428/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=658,176,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3429/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=658,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3430/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=658,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3431/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=658,752,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3432/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=658,944,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3433/500000] + train/ActionL1Loss=0.0824 + throughput/total_tokens=659,136,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3434/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=659,328,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3435/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=659,520,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3436/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=659,712,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3437/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=659,904,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3438/500000] + train/ActionL1Loss=0.0764 + throughput/total_tokens=660,096,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3439/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=660,288,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3440/500000] + optim/total_grad_norm=10.07 + train/ActionL1Loss=0.0697 + throughput/total_tokens=660,480,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=3441/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=660,672,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3442/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=660,864,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3443/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=661,056,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3444/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=661,248,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3445/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=661,440,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3446/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=661,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3447/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=661,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3448/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=662,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3449/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=662,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3450/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=662,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3451/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=662,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3452/500000] + train/ActionL1Loss=0.0621 + throughput/total_tokens=662,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3453/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=662,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3454/500000] + train/ActionL1Loss=0.0733 + throughput/total_tokens=663,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3455/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=663,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3456/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=663,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3457/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=663,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3458/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=663,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3459/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=664,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3460/500000] + optim/total_grad_norm=8.956 + train/ActionL1Loss=0.0505 + throughput/total_tokens=664,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3461/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=664,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3462/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=664,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3463/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=664,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3464/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=665,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3465/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=665,280,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3466/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=665,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3467/500000] + train/ActionL1Loss=0.0779 + throughput/total_tokens=665,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3468/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=665,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3469/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=666,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3470/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=666,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3471/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=666,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3472/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=666,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3473/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=666,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3474/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=667,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3475/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=667,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3476/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=667,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3477/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=667,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3478/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=667,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3479/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=667,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3480/500000] + optim/total_grad_norm=9.069 + train/ActionL1Loss=0.0520 + throughput/total_tokens=668,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3481/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=668,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3482/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=668,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3483/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=668,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3484/500000] + train/ActionL1Loss=0.0659 + throughput/total_tokens=668,928,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3485/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=669,120,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3486/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=669,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3487/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=669,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3488/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=669,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3489/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=669,888,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3490/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=670,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3491/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=670,272,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3492/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=670,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3493/500000] + train/ActionL1Loss=0.0707 + throughput/total_tokens=670,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3494/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=670,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3495/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=671,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3496/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=671,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3497/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=671,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3498/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=671,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3499/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=671,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3500/500000] + optim/total_grad_norm=9.452 + train/ActionL1Loss=0.0583 + throughput/total_tokens=672,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/12 [12:59:12] INFO | >> Saving config... checkpoint.py:608 +10/12 [12:59:59] INFO | >> Saving model state... checkpoint.py:796 +10/12 [13:01:08] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [13:02:31] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=3501/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=672,192,000 + throughput/device/tokens_per_second=1,210 + throughput/device/batches_per_second=0.0504 +[step=3502/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=672,384,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=3503/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=672,576,000 + throughput/device/tokens_per_second=1,136 + throughput/device/batches_per_second=0.0473 +[step=3504/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=672,768,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=3505/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=672,960,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=3506/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=673,152,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=3507/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=673,344,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0483 +[step=3508/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=673,536,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=3509/500000] + train/ActionL1Loss=0.0704 + throughput/total_tokens=673,728,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 +[step=3510/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=673,920,000 + throughput/device/tokens_per_second=1,165 + throughput/device/batches_per_second=0.0486 + System/Peak GPU Memory (MB)=46,924 +[step=3511/500000] + train/ActionL1Loss=0.0742 + throughput/total_tokens=674,112,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 +[step=3512/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=674,304,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=3513/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=674,496,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=3514/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=674,688,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=3515/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=674,880,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=3516/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=675,072,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=3517/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=675,264,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=3518/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=675,456,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=3519/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=675,648,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=3520/500000] + optim/total_grad_norm=9.494 + train/ActionL1Loss=0.0497 + throughput/total_tokens=675,840,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=3521/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=676,032,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=3522/500000] + train/ActionL1Loss=0.0558 + throughput/total_tokens=676,224,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3523/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=676,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3524/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=676,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3525/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=676,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3526/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=676,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3527/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=677,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3528/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=677,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3529/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=677,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3530/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=677,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3531/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=677,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3532/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=678,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3533/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=678,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3534/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=678,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3535/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=678,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3536/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=678,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3537/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=679,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3538/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=679,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3539/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=679,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3540/500000] + optim/total_grad_norm=10.26 + train/ActionL1Loss=0.0345 + throughput/total_tokens=679,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3541/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=679,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3542/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=680,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3543/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=680,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3544/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=680,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3545/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=680,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3546/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=680,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3547/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=681,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3548/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=681,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3549/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=681,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3550/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=681,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3551/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=681,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3552/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=681,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3553/500000] + train/ActionL1Loss=0.0692 + throughput/total_tokens=682,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3554/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=682,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3555/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=682,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3556/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=682,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3557/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=682,944,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3558/500000] + train/ActionL1Loss=0.0725 + throughput/total_tokens=683,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3559/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=683,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3560/500000] + optim/total_grad_norm=9.821 + train/ActionL1Loss=0.0674 + throughput/total_tokens=683,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3561/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=683,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3562/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=683,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3563/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=684,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3564/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=684,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3565/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=684,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3566/500000] + train/ActionL1Loss=0.0682 + throughput/total_tokens=684,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3567/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=684,864,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=3568/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=685,056,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3569/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=685,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3570/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=685,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3571/500000] + train/ActionL1Loss=0.0730 + throughput/total_tokens=685,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3572/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=685,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3573/500000] + train/ActionL1Loss=0.0729 + throughput/total_tokens=686,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3574/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=686,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3575/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=686,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3576/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=686,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3577/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=686,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3578/500000] + train/ActionL1Loss=0.0727 + throughput/total_tokens=686,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3579/500000] + train/ActionL1Loss=0.0774 + throughput/total_tokens=687,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3580/500000] + optim/total_grad_norm=7.989 + train/ActionL1Loss=0.0605 + throughput/total_tokens=687,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3581/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=687,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3582/500000] + train/ActionL1Loss=0.0738 + throughput/total_tokens=687,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3583/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=687,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3584/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=688,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3585/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=688,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3586/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=688,512,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3587/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=688,704,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3588/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=688,896,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3589/500000] + train/ActionL1Loss=0.0700 + throughput/total_tokens=689,088,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3590/500000] + train/ActionL1Loss=0.0752 + throughput/total_tokens=689,280,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3591/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=689,472,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3592/500000] + train/ActionL1Loss=0.0805 + throughput/total_tokens=689,664,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3593/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=689,856,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3594/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=690,048,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3595/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=690,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3596/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=690,432,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3597/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=690,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3598/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=690,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3599/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=691,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3600/500000] + optim/total_grad_norm=8.395 + train/ActionL1Loss=0.0673 + throughput/total_tokens=691,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3601/500000] + train/ActionL1Loss=0.0621 + throughput/total_tokens=691,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3602/500000] + train/ActionL1Loss=0.0778 + throughput/total_tokens=691,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3603/500000] + train/ActionL1Loss=0.0646 + throughput/total_tokens=691,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3604/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=691,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3605/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=692,160,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3606/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=692,352,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3607/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=692,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3608/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=692,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3609/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=692,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3610/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=693,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3611/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=693,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3612/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=693,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3613/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=693,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3614/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=693,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3615/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=694,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3616/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=694,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3617/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=694,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3618/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=694,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3619/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=694,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3620/500000] + optim/total_grad_norm=9.646 + train/ActionL1Loss=0.0477 + throughput/total_tokens=695,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3621/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=695,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3622/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=695,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3623/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=695,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3624/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=695,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3625/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=696,000,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3626/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=696,192,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3627/500000] + train/ActionL1Loss=0.0686 + throughput/total_tokens=696,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3628/500000] + train/ActionL1Loss=0.0647 + throughput/total_tokens=696,576,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3629/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=696,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3630/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=696,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3631/500000] + train/ActionL1Loss=0.0717 + throughput/total_tokens=697,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3632/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=697,344,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3633/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=697,536,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3634/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=697,728,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3635/500000] + train/ActionL1Loss=0.0701 + throughput/total_tokens=697,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3636/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=698,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3637/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=698,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3638/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=698,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3639/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=698,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3640/500000] + optim/total_grad_norm=8.631 + train/ActionL1Loss=0.0451 + throughput/total_tokens=698,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3641/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=699,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3642/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=699,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3643/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=699,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3644/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=699,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3645/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=699,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3646/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=700,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3647/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=700,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3648/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=700,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3649/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=700,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3650/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=700,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3651/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=700,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3652/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=701,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3653/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=701,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3654/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=701,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=3655/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=701,760,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=3656/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=701,952,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=3657/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=702,144,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3658/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=702,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3659/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=702,528,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=3660/500000] + optim/total_grad_norm=9.286 + train/ActionL1Loss=0.0565 + throughput/total_tokens=702,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3661/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=702,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3662/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=703,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3663/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=703,296,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3664/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=703,488,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3665/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=703,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3666/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=703,872,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3667/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=704,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3668/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=704,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3669/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=704,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3670/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=704,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3671/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=704,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3672/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=705,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3673/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=705,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3674/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=705,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3675/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=705,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3676/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=705,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3677/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=705,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3678/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=706,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3679/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=706,368,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3680/500000] + optim/total_grad_norm=9.823 + train/ActionL1Loss=0.0609 + throughput/total_tokens=706,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3681/500000] + train/ActionL1Loss=0.0713 + throughput/total_tokens=706,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3682/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=706,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3683/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=707,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3684/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=707,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3685/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=707,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3686/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=707,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3687/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=707,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3688/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=708,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3689/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=708,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3690/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=708,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3691/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=708,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3692/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=708,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3693/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=709,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3694/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=709,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3695/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=709,440,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3696/500000] + train/ActionL1Loss=0.0653 + throughput/total_tokens=709,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3697/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=709,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3698/500000] + train/ActionL1Loss=0.0654 + throughput/total_tokens=710,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3699/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=710,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3700/500000] + optim/total_grad_norm=9.523 + train/ActionL1Loss=0.0590 + throughput/total_tokens=710,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3701/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=710,592,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3702/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=710,784,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=3703/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=710,976,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3704/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=711,168,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3705/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=711,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3706/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=711,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3707/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=711,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3708/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=711,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3709/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=712,128,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3710/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=712,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3711/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=712,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3712/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=712,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3713/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=712,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3714/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=713,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3715/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=713,280,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=3716/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=713,472,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3717/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=713,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3718/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=713,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3719/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=714,048,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3720/500000] + optim/total_grad_norm=8.466 + train/ActionL1Loss=0.0466 + throughput/total_tokens=714,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3721/500000] + train/ActionL1Loss=0.0707 + throughput/total_tokens=714,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3722/500000] + train/ActionL1Loss=0.0704 + throughput/total_tokens=714,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3723/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=714,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3724/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=715,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3725/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=715,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3726/500000] + train/ActionL1Loss=0.0706 + throughput/total_tokens=715,392,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3727/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=715,584,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3728/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=715,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3729/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=715,968,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3730/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=716,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3731/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=716,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3732/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=716,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3733/500000] + train/ActionL1Loss=0.0696 + throughput/total_tokens=716,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3734/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=716,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3735/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=717,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3736/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=717,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3737/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=717,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3738/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=717,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3739/500000] + train/ActionL1Loss=0.0816 + throughput/total_tokens=717,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3740/500000] + optim/total_grad_norm=10.01 + train/ActionL1Loss=0.0689 + throughput/total_tokens=718,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3741/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=718,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3742/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=718,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3743/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=718,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3744/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=718,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3745/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=719,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3746/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=719,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3747/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=719,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3748/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=719,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3749/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=719,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3750/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=720,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3751/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=720,192,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3752/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=720,384,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3753/500000] + train/ActionL1Loss=0.0782 + throughput/total_tokens=720,576,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3754/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=720,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3755/500000] + train/ActionL1Loss=0.0790 + throughput/total_tokens=720,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3756/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=721,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3757/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=721,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3758/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=721,536,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3759/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=721,728,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3760/500000] + optim/total_grad_norm=8.416 + train/ActionL1Loss=0.0697 + throughput/total_tokens=721,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3761/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=722,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3762/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=722,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3763/500000] + train/ActionL1Loss=0.0707 + throughput/total_tokens=722,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3764/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=722,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3765/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=722,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3766/500000] + train/ActionL1Loss=0.0558 + throughput/total_tokens=723,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3767/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=723,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3768/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=723,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3769/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=723,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3770/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=723,840,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3771/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=724,032,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3772/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=724,224,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3773/500000] + train/ActionL1Loss=0.0694 + throughput/total_tokens=724,416,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3774/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=724,608,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3775/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=724,800,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3776/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=724,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3777/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=725,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3778/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=725,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3779/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=725,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3780/500000] + optim/total_grad_norm=8.094 + train/ActionL1Loss=0.0625 + throughput/total_tokens=725,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3781/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=725,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3782/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=726,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3783/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=726,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3784/500000] + train/ActionL1Loss=0.0724 + throughput/total_tokens=726,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3785/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=726,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3786/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=726,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3787/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=727,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3788/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=727,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3789/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=727,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3790/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=727,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3791/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=727,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3792/500000] + train/ActionL1Loss=0.0653 + throughput/total_tokens=728,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3793/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=728,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3794/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=728,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3795/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=728,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3796/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=728,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3797/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=729,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3798/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=729,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3799/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=729,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3800/500000] + optim/total_grad_norm=9.655 + train/ActionL1Loss=0.0458 + throughput/total_tokens=729,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3801/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=729,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3802/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=729,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3803/500000] + train/ActionL1Loss=0.0839 + throughput/total_tokens=730,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3804/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=730,368,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3805/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=730,560,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3806/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=730,752,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3807/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=730,944,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3808/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=731,136,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3809/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=731,328,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3810/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=731,520,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=3811/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=731,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3812/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=731,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3813/500000] + train/ActionL1Loss=0.0679 + throughput/total_tokens=732,096,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=3814/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=732,288,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=3815/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=732,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3816/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=732,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3817/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=732,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3818/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=733,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3819/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=733,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3820/500000] + optim/total_grad_norm=9.217 + train/ActionL1Loss=0.0670 + throughput/total_tokens=733,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3821/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=733,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3822/500000] + train/ActionL1Loss=0.0711 + throughput/total_tokens=733,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3823/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=734,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3824/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=734,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3825/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=734,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3826/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=734,592,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3827/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=734,784,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3828/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=734,976,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3829/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=735,168,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3830/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=735,360,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=3831/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=735,552,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3832/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=735,744,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3833/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=735,936,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3834/500000] + train/ActionL1Loss=0.0736 + throughput/total_tokens=736,128,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3835/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=736,320,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3836/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=736,512,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3837/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=736,704,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3838/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=736,896,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3839/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=737,088,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3840/500000] + optim/total_grad_norm=7.985 + train/ActionL1Loss=0.0671 + throughput/total_tokens=737,280,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=3841/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=737,472,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3842/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=737,664,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3843/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=737,856,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3844/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=738,048,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3845/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=738,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3846/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=738,432,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3847/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=738,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3848/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=738,816,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3849/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=739,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3850/500000] + train/ActionL1Loss=0.0670 + throughput/total_tokens=739,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3851/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=739,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3852/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=739,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3853/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=739,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3854/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=739,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3855/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=740,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3856/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=740,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3857/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=740,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3858/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=740,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3859/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=740,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3860/500000] + optim/total_grad_norm=9.539 + train/ActionL1Loss=0.0780 + throughput/total_tokens=741,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=3861/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=741,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3862/500000] + train/ActionL1Loss=0.0724 + throughput/total_tokens=741,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3863/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=741,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3864/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=741,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=3865/500000] + train/ActionL1Loss=0.0738 + throughput/total_tokens=742,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3866/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=742,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3867/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=742,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3868/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=742,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3869/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=742,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3870/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=743,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3871/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=743,232,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3872/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=743,424,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3873/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=743,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3874/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=743,808,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3875/500000] + train/ActionL1Loss=0.0732 + throughput/total_tokens=744,000,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3876/500000] + train/ActionL1Loss=0.0774 + throughput/total_tokens=744,192,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3877/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=744,384,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=3878/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=744,576,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3879/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=744,768,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3880/500000] + optim/total_grad_norm=6.861 + train/ActionL1Loss=0.0558 + throughput/total_tokens=744,960,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3881/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=745,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3882/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=745,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3883/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=745,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3884/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=745,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3885/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=745,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3886/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=746,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3887/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=746,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3888/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=746,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3889/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=746,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3890/500000] + train/ActionL1Loss=0.0755 + throughput/total_tokens=746,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3891/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=747,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3892/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=747,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3893/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=747,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3894/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=747,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3895/500000] + train/ActionL1Loss=0.0734 + throughput/total_tokens=747,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3896/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=748,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3897/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=748,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3898/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=748,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3899/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=748,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3900/500000] + optim/total_grad_norm=6.437 + train/ActionL1Loss=0.0643 + throughput/total_tokens=748,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3901/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=748,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3902/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=749,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3903/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=749,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3904/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=749,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3905/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=749,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3906/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=749,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3907/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=750,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3908/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=750,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3909/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=750,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3910/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=750,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3911/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=750,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3912/500000] + train/ActionL1Loss=0.0671 + throughput/total_tokens=751,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3913/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=751,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3914/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=751,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3915/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=751,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3916/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=751,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3917/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=752,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3918/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=752,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3919/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=752,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3920/500000] + optim/total_grad_norm=8.683 + train/ActionL1Loss=0.0494 + throughput/total_tokens=752,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3921/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=752,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3922/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=753,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3923/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=753,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3924/500000] + train/ActionL1Loss=0.0731 + throughput/total_tokens=753,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3925/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=753,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3926/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=753,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3927/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=753,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3928/500000] + train/ActionL1Loss=0.0726 + throughput/total_tokens=754,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3929/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=754,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3930/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=754,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3931/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=754,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3932/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=754,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3933/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=755,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3934/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=755,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3935/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=755,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3936/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=755,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3937/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=755,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3938/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=756,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3939/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=756,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3940/500000] + optim/total_grad_norm=8.858 + train/ActionL1Loss=0.0555 + throughput/total_tokens=756,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3941/500000] + train/ActionL1Loss=0.0751 + throughput/total_tokens=756,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3942/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=756,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3943/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=757,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3944/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=757,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3945/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=757,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3946/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=757,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3947/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=757,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3948/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=758,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3949/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=758,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3950/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=758,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3951/500000] + train/ActionL1Loss=0.0694 + throughput/total_tokens=758,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3952/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=758,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3953/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=758,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3954/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=759,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=3955/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=759,360,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3956/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=759,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=3957/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=759,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3958/500000] + train/ActionL1Loss=0.0728 + throughput/total_tokens=759,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3959/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=760,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3960/500000] + optim/total_grad_norm=9.501 + train/ActionL1Loss=0.0763 + throughput/total_tokens=760,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=3961/500000] + train/ActionL1Loss=0.0646 + throughput/total_tokens=760,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3962/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=760,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3963/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=760,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3964/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=761,088,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=3965/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=761,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3966/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=761,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3967/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=761,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3968/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=761,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3969/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=762,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=3970/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=762,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3971/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=762,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3972/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=762,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3973/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=762,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3974/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=763,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3975/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=763,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3976/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=763,392,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3977/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=763,584,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3978/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=763,776,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3979/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=763,968,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3980/500000] + optim/total_grad_norm=9.196 + train/ActionL1Loss=0.0692 + throughput/total_tokens=764,160,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3981/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=764,352,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3982/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=764,544,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3983/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=764,736,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3984/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=764,928,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3985/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=765,120,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=3986/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=765,312,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3987/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=765,504,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3988/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=765,696,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3989/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=765,888,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=3990/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=766,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=3991/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=766,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3992/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=766,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3993/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=766,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3994/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=766,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3995/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=767,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3996/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=767,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3997/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=767,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=3998/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=767,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=3999/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=767,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4000/500000] + optim/total_grad_norm=11.09 + train/ActionL1Loss=0.0706 + throughput/total_tokens=768,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +10/12 [15:53:50] INFO | >> Saving config... checkpoint.py:608 +10/12 [15:54:22] INFO | >> Saving model state... checkpoint.py:796 +10/12 [15:55:32] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [15:57:04] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=4001/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=768,192,000 + throughput/device/tokens_per_second=1,210 + throughput/device/batches_per_second=0.0504 +[step=4002/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=768,384,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=4003/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=768,576,000 + throughput/device/tokens_per_second=1,136 + throughput/device/batches_per_second=0.0473 +[step=4004/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=768,768,000 + throughput/device/tokens_per_second=1,142 + throughput/device/batches_per_second=0.0476 +[step=4005/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=768,960,000 + throughput/device/tokens_per_second=1,147 + throughput/device/batches_per_second=0.0478 +[step=4006/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=769,152,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=4007/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=769,344,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4008/500000] + train/ActionL1Loss=0.0653 + throughput/total_tokens=769,536,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4009/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=769,728,000 + throughput/device/tokens_per_second=1,162 + throughput/device/batches_per_second=0.0484 +[step=4010/500000] + train/ActionL1Loss=0.0845 + throughput/total_tokens=769,920,000 + throughput/device/tokens_per_second=1,164 + throughput/device/batches_per_second=0.0485 + System/Peak GPU Memory (MB)=46,924 +[step=4011/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=770,112,000 + throughput/device/tokens_per_second=1,165 + throughput/device/batches_per_second=0.0486 +[step=4012/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=770,304,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=4013/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=770,496,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 +[step=4014/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=770,688,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=4015/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=770,880,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=4016/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=771,072,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=4017/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=771,264,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=4018/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=771,456,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=4019/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=771,648,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=4020/500000] + optim/total_grad_norm=8.924 + train/ActionL1Loss=0.0501 + throughput/total_tokens=771,840,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=4021/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=772,032,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=4022/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=772,224,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4023/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=772,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4024/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=772,608,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4025/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=772,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4026/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=772,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4027/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=773,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4028/500000] + train/ActionL1Loss=0.0678 + throughput/total_tokens=773,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4029/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=773,568,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4030/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=773,760,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4031/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=773,952,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4032/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=774,144,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=4033/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=774,336,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=4034/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=774,528,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4035/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=774,720,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4036/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=774,912,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4037/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=775,104,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4038/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=775,296,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4039/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=775,488,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4040/500000] + optim/total_grad_norm=10.00 + train/ActionL1Loss=0.0628 + throughput/total_tokens=775,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4041/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=775,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4042/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=776,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4043/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=776,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4044/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=776,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4045/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=776,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4046/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=776,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4047/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=777,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4048/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=777,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4049/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=777,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4050/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=777,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4051/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=777,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4052/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=777,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4053/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=778,176,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4054/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=778,368,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4055/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=778,560,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4056/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=778,752,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=4057/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=778,944,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4058/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=779,136,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4059/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=779,328,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4060/500000] + optim/total_grad_norm=8.662 + train/ActionL1Loss=0.0531 + throughput/total_tokens=779,520,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=4061/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=779,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4062/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=779,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4063/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=780,096,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4064/500000] + train/ActionL1Loss=0.0717 + throughput/total_tokens=780,288,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4065/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=780,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4066/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=780,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4067/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=780,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4068/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=781,056,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=4069/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=781,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4070/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=781,440,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4071/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=781,632,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4072/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=781,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4073/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=782,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4074/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=782,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4075/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=782,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4076/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=782,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4077/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=782,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4078/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=782,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4079/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=783,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4080/500000] + optim/total_grad_norm=10.68 + train/ActionL1Loss=0.0662 + throughput/total_tokens=783,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4081/500000] + train/ActionL1Loss=0.0684 + throughput/total_tokens=783,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4082/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=783,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4083/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=783,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4084/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=784,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4085/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=784,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4086/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=784,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4087/500000] + train/ActionL1Loss=0.0768 + throughput/total_tokens=784,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4088/500000] + train/ActionL1Loss=0.0689 + throughput/total_tokens=784,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4089/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=785,088,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4090/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=785,280,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4091/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=785,472,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4092/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=785,664,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4093/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=785,856,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4094/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=786,048,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4095/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=786,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4096/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=786,432,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4097/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=786,624,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=4098/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=786,816,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4099/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=787,008,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4100/500000] + optim/total_grad_norm=9.425 + train/ActionL1Loss=0.0634 + throughput/total_tokens=787,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4101/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=787,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4102/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=787,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4103/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=787,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4104/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=787,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4105/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=788,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4106/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=788,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4107/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=788,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4108/500000] + train/ActionL1Loss=0.0621 + throughput/total_tokens=788,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4109/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=788,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4110/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=789,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4111/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=789,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4112/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=789,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4113/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=789,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4114/500000] + train/ActionL1Loss=0.0731 + throughput/total_tokens=789,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4115/500000] + train/ActionL1Loss=0.0681 + throughput/total_tokens=790,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4116/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=790,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4117/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=790,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4118/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=790,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4119/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=790,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4120/500000] + optim/total_grad_norm=9.993 + train/ActionL1Loss=0.0438 + throughput/total_tokens=791,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4121/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=791,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4122/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=791,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4123/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=791,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4124/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=791,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4125/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=792,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4126/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=792,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4127/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=792,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4128/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=792,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4129/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=792,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4130/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=792,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4131/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=793,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4132/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=793,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4133/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=793,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4134/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=793,728,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4135/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=793,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4136/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=794,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4137/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=794,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4138/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=794,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4139/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=794,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4140/500000] + optim/total_grad_norm=7.776 + train/ActionL1Loss=0.0635 + throughput/total_tokens=794,880,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4141/500000] + train/ActionL1Loss=0.0754 + throughput/total_tokens=795,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4142/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=795,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4143/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=795,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4144/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=795,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4145/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=795,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4146/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=796,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4147/500000] + train/ActionL1Loss=0.0719 + throughput/total_tokens=796,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4148/500000] + train/ActionL1Loss=0.0659 + throughput/total_tokens=796,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4149/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=796,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4150/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=796,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4151/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=796,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4152/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=797,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4153/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=797,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4154/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=797,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4155/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=797,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4156/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=797,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4157/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=798,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4158/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=798,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4159/500000] + train/ActionL1Loss=0.0714 + throughput/total_tokens=798,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4160/500000] + optim/total_grad_norm=9.103 + train/ActionL1Loss=0.0584 + throughput/total_tokens=798,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4161/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=798,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4162/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=799,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4163/500000] + train/ActionL1Loss=0.0712 + throughput/total_tokens=799,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4164/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=799,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4165/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=799,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4166/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=799,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4167/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=800,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4168/500000] + train/ActionL1Loss=0.0726 + throughput/total_tokens=800,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4169/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=800,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4170/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=800,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4171/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=800,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4172/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=801,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4173/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=801,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4174/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=801,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4175/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=801,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4176/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=801,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4177/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=801,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4178/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=802,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4179/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=802,368,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4180/500000] + optim/total_grad_norm=5.622 + train/ActionL1Loss=0.0513 + throughput/total_tokens=802,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4181/500000] + train/ActionL1Loss=0.0705 + throughput/total_tokens=802,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4182/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=802,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4183/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=803,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4184/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=803,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4185/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=803,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4186/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=803,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4187/500000] + train/ActionL1Loss=0.0719 + throughput/total_tokens=803,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4188/500000] + train/ActionL1Loss=0.0758 + throughput/total_tokens=804,096,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4189/500000] + train/ActionL1Loss=0.0646 + throughput/total_tokens=804,288,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4190/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=804,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4191/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=804,672,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4192/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=804,864,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4193/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=805,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4194/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=805,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4195/500000] + train/ActionL1Loss=0.0761 + throughput/total_tokens=805,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4196/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=805,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4197/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=805,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4198/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=806,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4199/500000] + train/ActionL1Loss=0.0837 + throughput/total_tokens=806,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4200/500000] + optim/total_grad_norm=8.971 + train/ActionL1Loss=0.0721 + throughput/total_tokens=806,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4201/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=806,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4202/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=806,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4203/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=806,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4204/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=807,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4205/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=807,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4206/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=807,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4207/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=807,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4208/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=807,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4209/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=808,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4210/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=808,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4211/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=808,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4212/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=808,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4213/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=808,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4214/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=809,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4215/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=809,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4216/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=809,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4217/500000] + train/ActionL1Loss=0.0760 + throughput/total_tokens=809,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4218/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=809,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4219/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=810,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4220/500000] + optim/total_grad_norm=7.849 + train/ActionL1Loss=0.0477 + throughput/total_tokens=810,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4221/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=810,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4222/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=810,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4223/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=810,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4224/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=811,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4225/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=811,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4226/500000] + train/ActionL1Loss=0.0691 + throughput/total_tokens=811,392,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4227/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=811,584,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4228/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=811,776,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4229/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=811,968,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4230/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=812,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4231/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=812,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4232/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=812,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4233/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=812,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4234/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=812,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4235/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=813,120,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4236/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=813,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4237/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=813,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4238/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=813,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4239/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=813,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4240/500000] + optim/total_grad_norm=8.670 + train/ActionL1Loss=0.0507 + throughput/total_tokens=814,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4241/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=814,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4242/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=814,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4243/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=814,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4244/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=814,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4245/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=815,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4246/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=815,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4247/500000] + train/ActionL1Loss=0.0739 + throughput/total_tokens=815,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4248/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=815,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4249/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=815,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4250/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=816,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4251/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=816,192,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4252/500000] + train/ActionL1Loss=0.0758 + throughput/total_tokens=816,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4253/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=816,576,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4254/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=816,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4255/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=816,960,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4256/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=817,152,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4257/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=817,344,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4258/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=817,536,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4259/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=817,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4260/500000] + optim/total_grad_norm=8.746 + train/ActionL1Loss=0.0506 + throughput/total_tokens=817,920,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4261/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=818,112,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4262/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=818,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4263/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=818,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4264/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=818,688,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4265/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=818,880,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=4266/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=819,072,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4267/500000] + train/ActionL1Loss=0.0724 + throughput/total_tokens=819,264,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4268/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=819,456,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4269/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=819,648,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4270/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=819,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4271/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=820,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4272/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=820,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4273/500000] + train/ActionL1Loss=0.0705 + throughput/total_tokens=820,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4274/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=820,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4275/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=820,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4276/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=820,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4277/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=821,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4278/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=821,376,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4279/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=821,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4280/500000] + optim/total_grad_norm=7.290 + train/ActionL1Loss=0.0511 + throughput/total_tokens=821,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4281/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=821,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4282/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=822,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4283/500000] + train/ActionL1Loss=0.0721 + throughput/total_tokens=822,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4284/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=822,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4285/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=822,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4286/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=822,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4287/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=823,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4288/500000] + train/ActionL1Loss=0.0676 + throughput/total_tokens=823,296,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4289/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=823,488,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4290/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=823,680,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4291/500000] + train/ActionL1Loss=0.0817 + throughput/total_tokens=823,872,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4292/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=824,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4293/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=824,256,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4294/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=824,448,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4295/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=824,640,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4296/500000] + train/ActionL1Loss=0.0679 + throughput/total_tokens=824,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4297/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=825,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4298/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=825,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4299/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=825,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4300/500000] + optim/total_grad_norm=8.847 + train/ActionL1Loss=0.0655 + throughput/total_tokens=825,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4301/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=825,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4302/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=825,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4303/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=826,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4304/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=826,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4305/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=826,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4306/500000] + train/ActionL1Loss=0.0679 + throughput/total_tokens=826,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4307/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=826,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4308/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=827,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4309/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=827,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4310/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=827,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4311/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=827,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4312/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=827,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4313/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=828,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4314/500000] + train/ActionL1Loss=0.0687 + throughput/total_tokens=828,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4315/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=828,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4316/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=828,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4317/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=828,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4318/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=829,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4319/500000] + train/ActionL1Loss=0.0671 + throughput/total_tokens=829,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4320/500000] + optim/total_grad_norm=7.213 + train/ActionL1Loss=0.0550 + throughput/total_tokens=829,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4321/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=829,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4322/500000] + train/ActionL1Loss=0.0653 + throughput/total_tokens=829,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4323/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=830,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4324/500000] + train/ActionL1Loss=0.0723 + throughput/total_tokens=830,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4325/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=830,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4326/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=830,592,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4327/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=830,784,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4328/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=830,976,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4329/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=831,168,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4330/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=831,360,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4331/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=831,552,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4332/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=831,744,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4333/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=831,936,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4334/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=832,128,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4335/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=832,320,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4336/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=832,512,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4337/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=832,704,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4338/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=832,896,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4339/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=833,088,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4340/500000] + optim/total_grad_norm=8.192 + train/ActionL1Loss=0.0615 + throughput/total_tokens=833,280,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4341/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=833,472,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4342/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=833,664,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4343/500000] + train/ActionL1Loss=0.0694 + throughput/total_tokens=833,856,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4344/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=834,048,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4345/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=834,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4346/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=834,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4347/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=834,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4348/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=834,816,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4349/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=835,008,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4350/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=835,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4351/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=835,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4352/500000] + train/ActionL1Loss=0.0689 + throughput/total_tokens=835,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4353/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=835,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4354/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=835,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4355/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=836,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4356/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=836,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4357/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=836,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4358/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=836,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4359/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=836,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4360/500000] + optim/total_grad_norm=8.140 + train/ActionL1Loss=0.0444 + throughput/total_tokens=837,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4361/500000] + train/ActionL1Loss=0.0716 + throughput/total_tokens=837,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4362/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=837,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4363/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=837,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4364/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=837,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4365/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=838,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4366/500000] + train/ActionL1Loss=0.0681 + throughput/total_tokens=838,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4367/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=838,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4368/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=838,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4369/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=838,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4370/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=839,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4371/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=839,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4372/500000] + train/ActionL1Loss=0.0679 + throughput/total_tokens=839,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4373/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=839,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4374/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=839,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4375/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=840,000,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4376/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=840,192,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4377/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=840,384,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4378/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=840,576,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4379/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=840,768,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4380/500000] + optim/total_grad_norm=9.558 + train/ActionL1Loss=0.0466 + throughput/total_tokens=840,960,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4381/500000] + train/ActionL1Loss=0.0721 + throughput/total_tokens=841,152,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4382/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=841,344,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4383/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=841,536,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4384/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=841,728,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4385/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=841,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4386/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=842,112,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4387/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=842,304,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4388/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=842,496,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4389/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=842,688,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4390/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=842,880,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4391/500000] + train/ActionL1Loss=0.0682 + throughput/total_tokens=843,072,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4392/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=843,264,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4393/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=843,456,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4394/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=843,648,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4395/500000] + train/ActionL1Loss=0.0749 + throughput/total_tokens=843,840,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4396/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=844,032,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4397/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=844,224,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=4398/500000] + train/ActionL1Loss=0.0796 + throughput/total_tokens=844,416,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=4399/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=844,608,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=4400/500000] + optim/total_grad_norm=7.507 + train/ActionL1Loss=0.0721 + throughput/total_tokens=844,800,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=4401/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=844,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4402/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=845,184,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4403/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=845,376,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4404/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=845,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4405/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=845,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4406/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=845,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4407/500000] + train/ActionL1Loss=0.0730 + throughput/total_tokens=846,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4408/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=846,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4409/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=846,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4410/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=846,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4411/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=846,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4412/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=847,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4413/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=847,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4414/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=847,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4415/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=847,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4416/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=847,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4417/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=848,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4418/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=848,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4419/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=848,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4420/500000] + optim/total_grad_norm=8.697 + train/ActionL1Loss=0.0645 + throughput/total_tokens=848,640,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4421/500000] + train/ActionL1Loss=0.0734 + throughput/total_tokens=848,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4422/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=849,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4423/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=849,216,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=4424/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=849,408,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=4425/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=849,600,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=4426/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=849,792,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=4427/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=849,984,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4428/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=850,176,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4429/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=850,368,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4430/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=850,560,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4431/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=850,752,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4432/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=850,944,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4433/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=851,136,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4434/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=851,328,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4435/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=851,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4436/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=851,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4437/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=851,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4438/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=852,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4439/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=852,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4440/500000] + optim/total_grad_norm=7.593 + train/ActionL1Loss=0.0522 + throughput/total_tokens=852,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4441/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=852,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4442/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=852,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4443/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=853,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4444/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=853,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4445/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=853,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4446/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=853,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4447/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=853,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4448/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=854,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4449/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=854,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4450/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=854,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4451/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=854,592,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4452/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=854,784,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4453/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=854,976,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4454/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=855,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4455/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=855,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4456/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=855,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4457/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=855,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4458/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=855,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4459/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=856,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4460/500000] + optim/total_grad_norm=8.913 + train/ActionL1Loss=0.0322 + throughput/total_tokens=856,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=4461/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=856,512,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4462/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=856,704,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4463/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=856,896,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4464/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=857,088,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4465/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=857,280,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4466/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=857,472,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4467/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=857,664,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4468/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=857,856,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4469/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=858,048,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4470/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=858,240,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4471/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=858,432,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4472/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=858,624,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4473/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=858,816,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4474/500000] + train/ActionL1Loss=0.0697 + throughput/total_tokens=859,008,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4475/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=859,200,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4476/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=859,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4477/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=859,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4478/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=859,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4479/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=859,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4480/500000] + optim/total_grad_norm=9.765 + train/ActionL1Loss=0.0603 + throughput/total_tokens=860,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4481/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=860,352,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4482/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=860,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4483/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=860,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4484/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=860,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4485/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=861,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4486/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=861,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4487/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=861,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4488/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=861,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4489/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=861,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4490/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=862,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4491/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=862,272,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4492/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=862,464,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4493/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=862,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4494/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=862,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4495/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=863,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4496/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=863,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4497/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=863,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4498/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=863,616,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4499/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=863,808,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4500/500000] + optim/total_grad_norm=9.716 + train/ActionL1Loss=0.0619 + throughput/total_tokens=864,000,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +10/12 [18:48:32] INFO | >> Saving config... checkpoint.py:608 +10/12 [18:49:04] INFO | >> Saving model state... checkpoint.py:796 +10/12 [18:50:17] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [18:51:50] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=4501/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=864,192,000 + throughput/device/tokens_per_second=1,210 + throughput/device/batches_per_second=0.0504 +[step=4502/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=864,384,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=4503/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=864,576,000 + throughput/device/tokens_per_second=1,145 + throughput/device/batches_per_second=0.0477 +[step=4504/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=864,768,000 + throughput/device/tokens_per_second=1,150 + throughput/device/batches_per_second=0.0479 +[step=4505/500000] + train/ActionL1Loss=0.0731 + throughput/total_tokens=864,960,000 + throughput/device/tokens_per_second=1,158 + throughput/device/batches_per_second=0.0483 +[step=4506/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=865,152,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=4507/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=865,344,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=4508/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=865,536,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=4509/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=865,728,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0487 +[step=4510/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=865,920,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 + System/Peak GPU Memory (MB)=46,924 +[step=4511/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=866,112,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=4512/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=866,304,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=4513/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=866,496,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=4514/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=866,688,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=4515/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=866,880,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=4516/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=867,072,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=4517/500000] + train/ActionL1Loss=0.0745 + throughput/total_tokens=867,264,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=4518/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=867,456,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=4519/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=867,648,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=4520/500000] + optim/total_grad_norm=8.242 + train/ActionL1Loss=0.0570 + throughput/total_tokens=867,840,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 + System/Peak GPU Memory (MB)=46,924 +[step=4521/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=868,032,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=4522/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=868,224,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=4523/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=868,416,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4524/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=868,608,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4525/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=868,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4526/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=868,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4527/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=869,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4528/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=869,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4529/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=869,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4530/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=869,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4531/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=869,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4532/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=870,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4533/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=870,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4534/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=870,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4535/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=870,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4536/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=870,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4537/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=871,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4538/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=871,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4539/500000] + train/ActionL1Loss=0.0709 + throughput/total_tokens=871,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4540/500000] + optim/total_grad_norm=9.218 + train/ActionL1Loss=0.0592 + throughput/total_tokens=871,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4541/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=871,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4542/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=872,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4543/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=872,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4544/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=872,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4545/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=872,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4546/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=872,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4547/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=873,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4548/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=873,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4549/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=873,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4550/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=873,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4551/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=873,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4552/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=873,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4553/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=874,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4554/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=874,368,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4555/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=874,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4556/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=874,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4557/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=874,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4558/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=875,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4559/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=875,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4560/500000] + optim/total_grad_norm=9.646 + train/ActionL1Loss=0.0604 + throughput/total_tokens=875,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4561/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=875,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4562/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=875,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4563/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=876,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4564/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=876,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4565/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=876,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4566/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=876,672,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4567/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=876,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4568/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=877,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4569/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=877,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4570/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=877,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4571/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=877,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4572/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=877,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4573/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=878,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4574/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=878,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4575/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=878,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4576/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=878,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4577/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=878,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4578/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=878,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4579/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=879,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4580/500000] + optim/total_grad_norm=7.260 + train/ActionL1Loss=0.0580 + throughput/total_tokens=879,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4581/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=879,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4582/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=879,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4583/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=879,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4584/500000] + train/ActionL1Loss=0.0743 + throughput/total_tokens=880,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4585/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=880,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4586/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=880,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4587/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=880,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4588/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=880,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4589/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=881,088,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4590/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=881,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4591/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=881,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4592/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=881,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4593/500000] + train/ActionL1Loss=0.0673 + throughput/total_tokens=881,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4594/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=882,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4595/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=882,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4596/500000] + train/ActionL1Loss=0.0700 + throughput/total_tokens=882,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4597/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=882,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4598/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=882,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4599/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=883,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4600/500000] + optim/total_grad_norm=9.936 + train/ActionL1Loss=0.0597 + throughput/total_tokens=883,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4601/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=883,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4602/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=883,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4603/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=883,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4604/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=883,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4605/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=884,160,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=4606/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=884,352,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4607/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=884,544,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=4608/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=884,736,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=4609/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=884,928,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=4610/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=885,120,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=4611/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=885,312,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=4612/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=885,504,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=4613/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=885,696,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4614/500000] + train/ActionL1Loss=0.0720 + throughput/total_tokens=885,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4615/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=886,080,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4616/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=886,272,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4617/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=886,464,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4618/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=886,656,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4619/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=886,848,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4620/500000] + optim/total_grad_norm=10.22 + train/ActionL1Loss=0.0671 + throughput/total_tokens=887,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4621/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=887,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4622/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=887,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4623/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=887,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4624/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=887,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4625/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=888,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4626/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=888,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4627/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=888,384,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4628/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=888,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4629/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=888,768,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4630/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=888,960,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4631/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=889,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4632/500000] + train/ActionL1Loss=0.0700 + throughput/total_tokens=889,344,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4633/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=889,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4634/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=889,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4635/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=889,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4636/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=890,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4637/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=890,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4638/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=890,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4639/500000] + train/ActionL1Loss=0.0689 + throughput/total_tokens=890,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4640/500000] + optim/total_grad_norm=8.959 + train/ActionL1Loss=0.0422 + throughput/total_tokens=890,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4641/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=891,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4642/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=891,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4643/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=891,456,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4644/500000] + train/ActionL1Loss=0.0717 + throughput/total_tokens=891,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4645/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=891,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4646/500000] + train/ActionL1Loss=0.0558 + throughput/total_tokens=892,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4647/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=892,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4648/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=892,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4649/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=892,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4650/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=892,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4651/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=892,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4652/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=893,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4653/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=893,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4654/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=893,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4655/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=893,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4656/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=893,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4657/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=894,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4658/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=894,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4659/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=894,528,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4660/500000] + optim/total_grad_norm=9.285 + train/ActionL1Loss=0.0358 + throughput/total_tokens=894,720,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=4661/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=894,912,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4662/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=895,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4663/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=895,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4664/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=895,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4665/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=895,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4666/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=895,872,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4667/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=896,064,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4668/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=896,256,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4669/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=896,448,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=4670/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=896,640,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4671/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=896,832,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4672/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=897,024,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=4673/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=897,216,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4674/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=897,408,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4675/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=897,600,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4676/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=897,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=4677/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=897,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=4678/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=898,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4679/500000] + train/ActionL1Loss=0.0293 + throughput/total_tokens=898,368,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4680/500000] + optim/total_grad_norm=9.755 + train/ActionL1Loss=0.0373 + throughput/total_tokens=898,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4681/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=898,752,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=4682/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=898,944,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4683/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=899,136,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4684/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=899,328,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=4685/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=899,520,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=4686/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=899,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4687/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=899,904,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=4688/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=900,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4689/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=900,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4690/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=900,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4691/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=900,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4692/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=900,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4693/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=901,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4694/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=901,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4695/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=901,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4696/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=901,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4697/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=901,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4698/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=902,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4699/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=902,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4700/500000] + optim/total_grad_norm=8.931 + train/ActionL1Loss=0.0592 + throughput/total_tokens=902,400,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4701/500000] + train/ActionL1Loss=0.0721 + throughput/total_tokens=902,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4702/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=902,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4703/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=902,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4704/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=903,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4705/500000] + train/ActionL1Loss=0.0682 + throughput/total_tokens=903,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4706/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=903,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4707/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=903,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4708/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=903,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4709/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=904,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4710/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=904,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4711/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=904,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4712/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=904,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4713/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=904,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4714/500000] + train/ActionL1Loss=0.0737 + throughput/total_tokens=905,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4715/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=905,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4716/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=905,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4717/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=905,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4718/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=905,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4719/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=906,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4720/500000] + optim/total_grad_norm=9.887 + train/ActionL1Loss=0.0493 + throughput/total_tokens=906,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4721/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=906,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4722/500000] + train/ActionL1Loss=0.0678 + throughput/total_tokens=906,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4723/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=906,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4724/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=907,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4725/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=907,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4726/500000] + train/ActionL1Loss=0.0703 + throughput/total_tokens=907,392,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4727/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=907,584,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4728/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=907,776,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4729/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=907,968,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4730/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=908,160,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4731/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=908,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4732/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=908,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4733/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=908,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4734/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=908,928,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4735/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=909,120,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4736/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=909,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4737/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=909,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4738/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=909,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4739/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=909,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4740/500000] + optim/total_grad_norm=7.140 + train/ActionL1Loss=0.0518 + throughput/total_tokens=910,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4741/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=910,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4742/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=910,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4743/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=910,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4744/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=910,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4745/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=911,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4746/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=911,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4747/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=911,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4748/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=911,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4749/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=911,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4750/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=912,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4751/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=912,192,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4752/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=912,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4753/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=912,576,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4754/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=912,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4755/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=912,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4756/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=913,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4757/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=913,344,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4758/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=913,536,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4759/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=913,728,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4760/500000] + optim/total_grad_norm=8.741 + train/ActionL1Loss=0.0526 + throughput/total_tokens=913,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4761/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=914,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4762/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=914,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4763/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=914,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4764/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=914,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4765/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=914,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4766/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=915,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4767/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=915,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4768/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=915,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4769/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=915,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4770/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=915,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4771/500000] + train/ActionL1Loss=0.0718 + throughput/total_tokens=916,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4772/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=916,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4773/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=916,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4774/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=916,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4775/500000] + train/ActionL1Loss=0.0759 + throughput/total_tokens=916,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4776/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=916,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4777/500000] + train/ActionL1Loss=0.0687 + throughput/total_tokens=917,184,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4778/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=917,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4779/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=917,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4780/500000] + optim/total_grad_norm=8.764 + train/ActionL1Loss=0.0483 + throughput/total_tokens=917,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4781/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=917,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4782/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=918,144,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4783/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=918,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4784/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=918,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4785/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=918,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4786/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=918,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4787/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=919,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4788/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=919,296,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4789/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=919,488,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4790/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=919,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4791/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=919,872,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4792/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=920,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4793/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=920,256,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4794/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=920,448,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4795/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=920,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4796/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=920,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4797/500000] + train/ActionL1Loss=0.0894 + throughput/total_tokens=921,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4798/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=921,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4799/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=921,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4800/500000] + optim/total_grad_norm=7.913 + train/ActionL1Loss=0.0507 + throughput/total_tokens=921,600,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4801/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=921,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4802/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=921,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4803/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=922,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4804/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=922,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4805/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=922,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4806/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=922,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4807/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=922,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4808/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=923,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4809/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=923,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4810/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=923,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4811/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=923,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4812/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=923,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4813/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=924,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4814/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=924,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4815/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=924,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4816/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=924,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4817/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=924,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4818/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=925,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4819/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=925,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4820/500000] + optim/total_grad_norm=9.567 + train/ActionL1Loss=0.0550 + throughput/total_tokens=925,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4821/500000] + train/ActionL1Loss=0.0753 + throughput/total_tokens=925,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4822/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=925,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4823/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=926,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4824/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=926,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4825/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=926,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4826/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=926,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4827/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=926,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4828/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=926,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4829/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=927,168,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4830/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=927,360,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4831/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=927,552,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4832/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=927,744,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4833/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=927,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4834/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=928,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4835/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=928,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4836/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=928,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4837/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=928,704,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4838/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=928,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4839/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=929,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4840/500000] + optim/total_grad_norm=8.757 + train/ActionL1Loss=0.0577 + throughput/total_tokens=929,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4841/500000] + train/ActionL1Loss=0.0676 + throughput/total_tokens=929,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4842/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=929,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4843/500000] + train/ActionL1Loss=0.0752 + throughput/total_tokens=929,856,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4844/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=930,048,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4845/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=930,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4846/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=930,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4847/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=930,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4848/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=930,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4849/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=931,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4850/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=931,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4851/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=931,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4852/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=931,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4853/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=931,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4854/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=931,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4855/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=932,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4856/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=932,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4857/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=932,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4858/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=932,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4859/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=932,928,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4860/500000] + optim/total_grad_norm=9.229 + train/ActionL1Loss=0.0699 + throughput/total_tokens=933,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4861/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=933,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4862/500000] + train/ActionL1Loss=0.0709 + throughput/total_tokens=933,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4863/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=933,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4864/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=933,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4865/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=934,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4866/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=934,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4867/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=934,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4868/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=934,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4869/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=934,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4870/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=935,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4871/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=935,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4872/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=935,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4873/500000] + train/ActionL1Loss=0.0680 + throughput/total_tokens=935,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4874/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=935,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4875/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=936,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4876/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=936,192,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4877/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=936,384,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4878/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=936,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4879/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=936,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4880/500000] + optim/total_grad_norm=10.20 + train/ActionL1Loss=0.0611 + throughput/total_tokens=936,960,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4881/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=937,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4882/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=937,344,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4883/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=937,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4884/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=937,728,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4885/500000] + train/ActionL1Loss=0.0663 + throughput/total_tokens=937,920,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4886/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=938,112,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4887/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=938,304,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4888/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=938,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4889/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=938,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4890/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=938,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4891/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=939,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4892/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=939,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4893/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=939,456,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4894/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=939,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4895/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=939,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4896/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=940,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4897/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=940,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4898/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=940,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4899/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=940,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4900/500000] + optim/total_grad_norm=9.456 + train/ActionL1Loss=0.0692 + throughput/total_tokens=940,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=4901/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=940,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4902/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=941,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4903/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=941,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4904/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=941,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4905/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=941,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4906/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=941,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4907/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=942,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4908/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=942,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4909/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=942,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4910/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=942,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4911/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=942,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4912/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=943,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4913/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=943,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4914/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=943,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4915/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=943,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4916/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=943,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4917/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=944,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4918/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=944,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4919/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=944,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4920/500000] + optim/total_grad_norm=8.189 + train/ActionL1Loss=0.0419 + throughput/total_tokens=944,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4921/500000] + train/ActionL1Loss=0.0684 + throughput/total_tokens=944,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4922/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=945,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4923/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=945,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4924/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=945,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4925/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=945,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4926/500000] + train/ActionL1Loss=0.0723 + throughput/total_tokens=945,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4927/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=945,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4928/500000] + train/ActionL1Loss=0.0738 + throughput/total_tokens=946,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4929/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=946,368,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4930/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=946,560,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4931/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=946,752,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4932/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=946,944,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4933/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=947,136,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4934/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=947,328,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4935/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=947,520,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4936/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=947,712,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4937/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=947,904,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4938/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=948,096,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4939/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=948,288,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4940/500000] + optim/total_grad_norm=9.520 + train/ActionL1Loss=0.0663 + throughput/total_tokens=948,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4941/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=948,672,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4942/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=948,864,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4943/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=949,056,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4944/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=949,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4945/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=949,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4946/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=949,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4947/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=949,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4948/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=950,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4949/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=950,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4950/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=950,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4951/500000] + train/ActionL1Loss=0.0251 + throughput/total_tokens=950,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4952/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=950,784,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4953/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=950,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4954/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=951,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=4955/500000] + train/ActionL1Loss=0.0738 + throughput/total_tokens=951,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4956/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=951,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4957/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=951,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4958/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=951,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4959/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=952,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4960/500000] + optim/total_grad_norm=8.423 + train/ActionL1Loss=0.0530 + throughput/total_tokens=952,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=4961/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=952,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4962/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=952,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4963/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=952,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4964/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=953,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4965/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=953,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=4966/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=953,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=4967/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=953,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4968/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=953,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4969/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=954,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=4970/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=954,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4971/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=954,432,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4972/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=954,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4973/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=954,816,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4974/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=955,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4975/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=955,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4976/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=955,392,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4977/500000] + train/ActionL1Loss=0.0750 + throughput/total_tokens=955,584,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=4978/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=955,776,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4979/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=955,968,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=4980/500000] + optim/total_grad_norm=9.720 + train/ActionL1Loss=0.0451 + throughput/total_tokens=956,160,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4981/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=956,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4982/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=956,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4983/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=956,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4984/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=956,928,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4985/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=957,120,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=4986/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=957,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4987/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=957,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4988/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=957,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4989/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=957,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4990/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=958,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=4991/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=958,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4992/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=958,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=4993/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=958,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4994/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=958,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4995/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=959,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4996/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=959,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=4997/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=959,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4998/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=959,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=4999/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=959,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5000/500000] + optim/total_grad_norm=8.091 + train/ActionL1Loss=0.0550 + throughput/total_tokens=960,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +10/12 [21:43:16] INFO | >> Saving config... checkpoint.py:608 +10/12 [21:43:47] INFO | >> Saving model state... checkpoint.py:796 +10/12 [21:44:55] INFO | >> Saving optim state... checkpoint.py:811 +10/12 [21:46:27] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=5001/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=960,192,000 + throughput/device/tokens_per_second=1,211 + throughput/device/batches_per_second=0.0505 +[step=5002/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=960,384,000 + throughput/device/tokens_per_second=1,165 + throughput/device/batches_per_second=0.0486 +[step=5003/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=960,576,000 + throughput/device/tokens_per_second=1,143 + throughput/device/batches_per_second=0.0477 +[step=5004/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=960,768,000 + throughput/device/tokens_per_second=1,149 + throughput/device/batches_per_second=0.0479 +[step=5005/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=960,960,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5006/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=961,152,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5007/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=961,344,000 + throughput/device/tokens_per_second=1,163 + throughput/device/batches_per_second=0.0485 +[step=5008/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=961,536,000 + throughput/device/tokens_per_second=1,165 + throughput/device/batches_per_second=0.0485 +[step=5009/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=961,728,000 + throughput/device/tokens_per_second=1,166 + throughput/device/batches_per_second=0.0486 +[step=5010/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=961,920,000 + throughput/device/tokens_per_second=1,167 + throughput/device/batches_per_second=0.0486 + System/Peak GPU Memory (MB)=46,924 +[step=5011/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=962,112,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=5012/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=962,304,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=5013/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=962,496,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=5014/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=962,688,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=5015/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=962,880,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=5016/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=963,072,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=5017/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=963,264,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=5018/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=963,456,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=5019/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=963,648,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5020/500000] + optim/total_grad_norm=10.87 + train/ActionL1Loss=0.0548 + throughput/total_tokens=963,840,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=5021/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=964,032,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=5022/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=964,224,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5023/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=964,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5024/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=964,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5025/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=964,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5026/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=964,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5027/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=965,184,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5028/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=965,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5029/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=965,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5030/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=965,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5031/500000] + train/ActionL1Loss=0.0670 + throughput/total_tokens=965,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5032/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=966,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5033/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=966,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5034/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=966,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5035/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=966,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5036/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=966,912,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5037/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=967,104,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5038/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=967,296,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5039/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=967,488,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5040/500000] + optim/total_grad_norm=9.153 + train/ActionL1Loss=0.0385 + throughput/total_tokens=967,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5041/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=967,872,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5042/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=968,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5043/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=968,256,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5044/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=968,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5045/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=968,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5046/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=968,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5047/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=969,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5048/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=969,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5049/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=969,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5050/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=969,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5051/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=969,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5052/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=969,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5053/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=970,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5054/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=970,368,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5055/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=970,560,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5056/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=970,752,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5057/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=970,944,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5058/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=971,136,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5059/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=971,328,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5060/500000] + optim/total_grad_norm=8.042 + train/ActionL1Loss=0.0549 + throughput/total_tokens=971,520,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=5061/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=971,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5062/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=971,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5063/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=972,096,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5064/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=972,288,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5065/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=972,480,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5066/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=972,672,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5067/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=972,864,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5068/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=973,056,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5069/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=973,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5070/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=973,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5071/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=973,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5072/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=973,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5073/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=974,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5074/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=974,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5075/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=974,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5076/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=974,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5077/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=974,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5078/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=974,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5079/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=975,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5080/500000] + optim/total_grad_norm=9.007 + train/ActionL1Loss=0.0630 + throughput/total_tokens=975,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5081/500000] + train/ActionL1Loss=0.0671 + throughput/total_tokens=975,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5082/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=975,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5083/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=975,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5084/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=976,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5085/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=976,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5086/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=976,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5087/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=976,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5088/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=976,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5089/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=977,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5090/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=977,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5091/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=977,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5092/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=977,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5093/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=977,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5094/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=978,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5095/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=978,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5096/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=978,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5097/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=978,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5098/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=978,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5099/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=979,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5100/500000] + optim/total_grad_norm=7.573 + train/ActionL1Loss=0.0380 + throughput/total_tokens=979,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5101/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=979,392,000 + throughput/device/tokens_per_second=1,159 + throughput/device/batches_per_second=0.0483 +[step=5102/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=979,584,000 + throughput/device/tokens_per_second=1,157 + throughput/device/batches_per_second=0.0482 +[step=5103/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=979,776,000 + throughput/device/tokens_per_second=1,155 + throughput/device/batches_per_second=0.0481 +[step=5104/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=979,968,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=5105/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=980,160,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=5106/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=980,352,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=5107/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=980,544,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0481 +[step=5108/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=980,736,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=5109/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=980,928,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5110/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=981,120,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 + System/Peak GPU Memory (MB)=46,924 +[step=5111/500000] + train/ActionL1Loss=0.0732 + throughput/total_tokens=981,312,000 + throughput/device/tokens_per_second=1,153 + throughput/device/batches_per_second=0.0480 +[step=5112/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=981,504,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5113/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=981,696,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5114/500000] + train/ActionL1Loss=0.0676 + throughput/total_tokens=981,888,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5115/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=982,080,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5116/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=982,272,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5117/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=982,464,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5118/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=982,656,000 + throughput/device/tokens_per_second=1,151 + throughput/device/batches_per_second=0.0480 +[step=5119/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=982,848,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5120/500000] + optim/total_grad_norm=10.46 + train/ActionL1Loss=0.0352 + throughput/total_tokens=983,040,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=5121/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=983,232,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=5122/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=983,424,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5123/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=983,616,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5124/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=983,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5125/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=984,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5126/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=984,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5127/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=984,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5128/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=984,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5129/500000] + train/ActionL1Loss=0.0345 + throughput/total_tokens=984,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5130/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=984,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5131/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=985,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5132/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=985,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5133/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=985,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5134/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=985,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5135/500000] + train/ActionL1Loss=0.0650 + throughput/total_tokens=985,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5136/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=986,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5137/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=986,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5138/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=986,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5139/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=986,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5140/500000] + optim/total_grad_norm=8.757 + train/ActionL1Loss=0.0588 + throughput/total_tokens=986,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5141/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=987,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5142/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=987,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5143/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=987,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5144/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=987,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5145/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=987,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5146/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=988,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5147/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=988,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5148/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=988,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5149/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=988,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5150/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=988,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5151/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=988,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5152/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=989,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5153/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=989,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5154/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=989,568,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5155/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=989,760,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5156/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=989,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5157/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=990,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5158/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=990,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5159/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=990,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5160/500000] + optim/total_grad_norm=8.442 + train/ActionL1Loss=0.0530 + throughput/total_tokens=990,720,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5161/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=990,912,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5162/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=991,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5163/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=991,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5164/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=991,488,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5165/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=991,680,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5166/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=991,872,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5167/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=992,064,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5168/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=992,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5169/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=992,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5170/500000] + train/ActionL1Loss=0.0700 + throughput/total_tokens=992,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5171/500000] + train/ActionL1Loss=0.0730 + throughput/total_tokens=992,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5172/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=993,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5173/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=993,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5174/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=993,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5175/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=993,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5176/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=993,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5177/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=993,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5178/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=994,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5179/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=994,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5180/500000] + optim/total_grad_norm=10.05 + train/ActionL1Loss=0.0418 + throughput/total_tokens=994,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5181/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=994,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5182/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=994,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5183/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=995,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5184/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=995,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5185/500000] + train/ActionL1Loss=0.0738 + throughput/total_tokens=995,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5186/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=995,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5187/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=995,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5188/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=996,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5189/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=996,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5190/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=996,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5191/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=996,672,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5192/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=996,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5193/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=997,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5194/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=997,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5195/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=997,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5196/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=997,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5197/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=997,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5198/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=998,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5199/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=998,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5200/500000] + optim/total_grad_norm=9.556 + train/ActionL1Loss=0.0531 + throughput/total_tokens=998,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5201/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=998,592,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5202/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=998,784,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=5203/500000] + train/ActionL1Loss=0.0621 + throughput/total_tokens=998,976,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5204/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=999,168,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=5205/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=999,360,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=5206/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=999,552,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=5207/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=999,744,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=5208/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=999,936,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5209/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=1,000,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5210/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=1,000,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5211/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,000,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5212/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,000,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5213/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,000,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5214/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,001,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5215/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,001,280,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5216/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=1,001,472,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5217/500000] + train/ActionL1Loss=0.0775 + throughput/total_tokens=1,001,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5218/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,001,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5219/500000] + train/ActionL1Loss=0.0772 + throughput/total_tokens=1,002,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5220/500000] + optim/total_grad_norm=9.370 + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,002,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5221/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=1,002,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5222/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,002,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5223/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,002,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5224/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,003,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5225/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,003,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5226/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=1,003,392,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5227/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,003,584,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5228/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,003,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5229/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,003,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5230/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=1,004,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5231/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=1,004,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5232/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,004,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5233/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,004,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5234/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,004,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5235/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=1,005,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5236/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,005,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5237/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,005,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5238/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=1,005,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5239/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,005,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5240/500000] + optim/total_grad_norm=7.605 + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,006,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5241/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,006,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5242/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,006,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5243/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=1,006,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5244/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,006,848,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5245/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,007,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5246/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,007,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5247/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,007,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5248/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,007,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5249/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,007,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5250/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,008,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5251/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,008,192,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5252/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,008,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5253/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=1,008,576,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5254/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,008,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5255/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,008,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5256/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,009,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5257/500000] + train/ActionL1Loss=0.0285 + throughput/total_tokens=1,009,344,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5258/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,009,536,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5259/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,009,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5260/500000] + optim/total_grad_norm=9.347 + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,009,920,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5261/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,010,112,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5262/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,010,304,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5263/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,010,496,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5264/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,010,688,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5265/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,010,880,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5266/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,011,072,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5267/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,011,264,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5268/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,011,456,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5269/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,011,648,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5270/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,011,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5271/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,012,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5272/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,012,224,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5273/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=1,012,416,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5274/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,012,608,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5275/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,012,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5276/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,012,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5277/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,013,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5278/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,013,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5279/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,013,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5280/500000] + optim/total_grad_norm=9.351 + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,013,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5281/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,013,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5282/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,014,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5283/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,014,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5284/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=1,014,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5285/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,014,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5286/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,014,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5287/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,015,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5288/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,015,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5289/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=1,015,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5290/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,015,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5291/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,015,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5292/500000] + train/ActionL1Loss=0.0558 + throughput/total_tokens=1,016,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5293/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,016,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5294/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,016,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5295/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=1,016,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5296/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,016,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5297/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,017,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5298/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,017,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5299/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,017,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5300/500000] + optim/total_grad_norm=8.703 + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,017,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5301/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=1,017,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5302/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,017,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5303/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,018,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5304/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,018,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5305/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,018,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5306/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,018,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5307/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=1,018,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5308/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=1,019,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5309/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,019,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5310/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=1,019,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5311/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,019,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5312/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,019,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5313/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=1,020,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5314/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,020,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5315/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,020,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5316/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,020,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5317/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=1,020,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5318/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,021,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5319/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,021,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5320/500000] + optim/total_grad_norm=8.693 + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,021,440,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5321/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,021,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5322/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,021,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5323/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,022,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5324/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=1,022,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5325/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,022,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5326/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,022,592,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5327/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,022,784,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5328/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,022,976,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5329/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,023,168,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5330/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,023,360,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5331/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=1,023,552,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5332/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,023,744,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5333/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,023,936,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5334/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,024,128,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5335/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=1,024,320,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5336/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,024,512,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5337/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,024,704,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5338/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,024,896,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5339/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,025,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5340/500000] + optim/total_grad_norm=8.115 + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,025,280,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5341/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,025,472,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5342/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=1,025,664,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5343/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,025,856,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5344/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,026,048,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5345/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,026,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5346/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,026,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5347/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,026,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5348/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,026,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5349/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,027,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5350/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,027,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5351/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,027,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5352/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,027,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5353/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,027,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5354/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,027,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5355/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,028,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5356/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,028,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5357/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,028,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5358/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,028,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5359/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,028,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5360/500000] + optim/total_grad_norm=8.915 + train/ActionL1Loss=0.0302 + throughput/total_tokens=1,029,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5361/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,029,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5362/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,029,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5363/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=1,029,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5364/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=1,029,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5365/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,030,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5366/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,030,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5367/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,030,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5368/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,030,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5369/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,030,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5370/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,031,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5371/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,031,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5372/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,031,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5373/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,031,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5374/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,031,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5375/500000] + train/ActionL1Loss=0.0722 + throughput/total_tokens=1,032,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5376/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,032,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5377/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,032,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5378/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,032,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5379/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,032,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5380/500000] + optim/total_grad_norm=10.03 + train/ActionL1Loss=0.0622 + throughput/total_tokens=1,032,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5381/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,033,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5382/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=1,033,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5383/500000] + train/ActionL1Loss=0.0654 + throughput/total_tokens=1,033,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5384/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,033,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5385/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=1,033,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5386/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,034,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5387/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,034,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5388/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,034,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5389/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=1,034,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5390/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=1,034,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5391/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,035,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5392/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=1,035,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5393/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,035,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5394/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,035,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5395/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=1,035,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5396/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,036,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5397/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,036,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5398/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=1,036,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5399/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,036,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5400/500000] + optim/total_grad_norm=9.299 + train/ActionL1Loss=0.0632 + throughput/total_tokens=1,036,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5401/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,036,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5402/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=1,037,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5403/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,037,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5404/500000] + train/ActionL1Loss=0.0621 + throughput/total_tokens=1,037,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5405/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,037,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5406/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=1,037,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5407/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,038,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5408/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,038,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5409/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,038,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5410/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,038,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5411/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,038,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5412/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,039,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5413/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,039,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5414/500000] + train/ActionL1Loss=0.0707 + throughput/total_tokens=1,039,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5415/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,039,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5416/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,039,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5417/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,040,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5418/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,040,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5419/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=1,040,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5420/500000] + optim/total_grad_norm=8.760 + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,040,640,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=5421/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,040,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5422/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,041,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5423/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,041,216,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5424/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,041,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5425/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,041,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5426/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,041,792,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5427/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,041,984,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5428/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,042,176,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5429/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,042,368,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5430/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,042,560,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5431/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,042,752,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5432/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,042,944,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5433/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=1,043,136,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5434/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,043,328,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5435/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,043,520,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5436/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,043,712,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5437/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,043,904,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5438/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,044,096,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5439/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=1,044,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5440/500000] + optim/total_grad_norm=7.563 + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,044,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5441/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,044,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5442/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,044,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5443/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,045,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5444/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,045,248,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5445/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,045,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5446/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=1,045,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5447/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,045,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5448/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,046,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5449/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,046,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5450/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,046,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5451/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,046,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5452/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,046,784,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5453/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=1,046,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5454/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,047,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5455/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,047,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5456/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,047,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5457/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,047,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5458/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,047,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5459/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,048,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5460/500000] + optim/total_grad_norm=7.948 + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,048,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5461/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,048,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5462/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=1,048,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5463/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=1,048,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5464/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,049,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5465/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,049,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5466/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=1,049,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5467/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,049,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5468/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,049,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5469/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,050,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5470/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=1,050,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5471/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,050,432,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5472/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,050,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5473/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,050,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5474/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,051,008,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5475/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,051,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5476/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,051,392,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5477/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=1,051,584,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5478/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,051,776,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5479/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,051,968,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5480/500000] + optim/total_grad_norm=7.241 + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,052,160,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5481/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,052,352,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5482/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=1,052,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5483/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,052,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5484/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,052,928,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5485/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,053,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5486/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,053,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5487/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,053,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5488/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,053,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5489/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,053,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5490/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,054,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5491/500000] + train/ActionL1Loss=0.0642 + throughput/total_tokens=1,054,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5492/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,054,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5493/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,054,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5494/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=1,054,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5495/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,055,040,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5496/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,055,232,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5497/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,055,424,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5498/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=1,055,616,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5499/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,055,808,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5500/500000] + optim/total_grad_norm=8.153 + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,056,000,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +10/13 [00:37:47] INFO | >> Saving config... checkpoint.py:608 +10/13 [00:38:29] INFO | >> Saving model state... checkpoint.py:796 +10/13 [00:39:41] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [00:41:12] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=5501/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=1,056,192,000 + throughput/device/tokens_per_second=1,211 + throughput/device/batches_per_second=0.0505 +[step=5502/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,056,384,000 + throughput/device/tokens_per_second=1,161 + throughput/device/batches_per_second=0.0484 +[step=5503/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,056,576,000 + throughput/device/tokens_per_second=1,152 + throughput/device/batches_per_second=0.0480 +[step=5504/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,056,768,000 + throughput/device/tokens_per_second=1,156 + throughput/device/batches_per_second=0.0482 +[step=5505/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,056,960,000 + throughput/device/tokens_per_second=1,160 + throughput/device/batches_per_second=0.0484 +[step=5506/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=1,057,152,000 + throughput/device/tokens_per_second=1,165 + throughput/device/batches_per_second=0.0486 +[step=5507/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,057,344,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=5508/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,057,536,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=5509/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,057,728,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=5510/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,057,920,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 + System/Peak GPU Memory (MB)=46,924 +[step=5511/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,058,112,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=5512/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,058,304,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=5513/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,058,496,000 + throughput/device/tokens_per_second=1,168 + throughput/device/batches_per_second=0.0487 +[step=5514/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,058,688,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=5515/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,058,880,000 + throughput/device/tokens_per_second=1,169 + throughput/device/batches_per_second=0.0487 +[step=5516/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=1,059,072,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=5517/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,059,264,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=5518/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=1,059,456,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=5519/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,059,648,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=5520/500000] + optim/total_grad_norm=8.703 + train/ActionL1Loss=0.0615 + throughput/total_tokens=1,059,840,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=5521/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,060,032,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=5522/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,060,224,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5523/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=1,060,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5524/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,060,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5525/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,060,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5526/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=1,060,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5527/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,061,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5528/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=1,061,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5529/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,061,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5530/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,061,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5531/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,061,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5532/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,062,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5533/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,062,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5534/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,062,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5535/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,062,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5536/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,062,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5537/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,063,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5538/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,063,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5539/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,063,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5540/500000] + optim/total_grad_norm=7.012 + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,063,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5541/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,063,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5542/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,064,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5543/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,064,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5544/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,064,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5545/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,064,640,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5546/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,064,832,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5547/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=1,065,024,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5548/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,065,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5549/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,065,408,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5550/500000] + train/ActionL1Loss=0.0558 + throughput/total_tokens=1,065,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5551/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,065,792,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5552/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,065,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5553/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=1,066,176,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5554/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,066,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5555/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=1,066,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5556/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,066,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5557/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,066,944,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5558/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,067,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5559/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=1,067,328,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5560/500000] + optim/total_grad_norm=9.641 + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,067,520,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5561/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,067,712,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5562/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=1,067,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5563/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,068,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5564/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,068,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5565/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,068,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5566/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,068,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5567/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,068,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5568/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,069,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5569/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,069,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5570/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,069,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5571/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,069,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5572/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,069,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5573/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,070,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5574/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,070,208,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5575/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,070,400,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5576/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,070,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5577/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=1,070,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5578/500000] + train/ActionL1Loss=0.0292 + throughput/total_tokens=1,070,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5579/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=1,071,168,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5580/500000] + optim/total_grad_norm=10.18 + train/ActionL1Loss=0.0735 + throughput/total_tokens=1,071,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5581/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=1,071,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5582/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,071,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5583/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,071,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5584/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,072,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5585/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,072,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5586/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=1,072,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5587/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=1,072,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5588/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,072,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5589/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,073,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5590/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,073,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5591/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=1,073,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5592/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,073,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5593/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=1,073,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5594/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,074,048,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5595/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,074,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5596/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,074,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5597/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,074,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5598/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,074,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5599/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,075,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5600/500000] + optim/total_grad_norm=9.520 + train/ActionL1Loss=0.0675 + throughput/total_tokens=1,075,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5601/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,075,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5602/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,075,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5603/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=1,075,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5604/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=1,075,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5605/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,076,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5606/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,076,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5607/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,076,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5608/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,076,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5609/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,076,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5610/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,077,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5611/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,077,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5612/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,077,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5613/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,077,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5614/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,077,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5615/500000] + train/ActionL1Loss=0.0247 + throughput/total_tokens=1,078,080,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5616/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,078,272,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5617/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,078,464,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5618/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,078,656,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5619/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,078,848,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5620/500000] + optim/total_grad_norm=6.851 + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,079,040,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5621/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,079,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5622/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,079,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5623/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,079,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5624/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,079,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5625/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,080,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5626/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,080,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5627/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,080,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5628/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=1,080,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5629/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,080,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5630/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,080,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5631/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,081,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5632/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,081,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5633/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,081,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5634/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,081,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5635/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,081,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5636/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,082,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5637/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,082,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5638/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,082,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5639/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,082,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5640/500000] + optim/total_grad_norm=8.697 + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,082,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5641/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,083,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5642/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=1,083,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5643/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,083,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5644/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,083,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5645/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,083,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5646/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=1,084,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5647/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,084,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5648/500000] + train/ActionL1Loss=0.0643 + throughput/total_tokens=1,084,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5649/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,084,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5650/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,084,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5651/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,084,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5652/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,085,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5653/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=1,085,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5654/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,085,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5655/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,085,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5656/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,085,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5657/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,086,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5658/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=1,086,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5659/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=1,086,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5660/500000] + optim/total_grad_norm=9.065 + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,086,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5661/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,086,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5662/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,087,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5663/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,087,296,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5664/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,087,488,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5665/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,087,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5666/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,087,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5667/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,088,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5668/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,088,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5669/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,088,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5670/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,088,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5671/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,088,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5672/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,089,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5673/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,089,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5674/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,089,408,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5675/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,089,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5676/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,089,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5677/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,089,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5678/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=1,090,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5679/500000] + train/ActionL1Loss=0.0708 + throughput/total_tokens=1,090,368,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5680/500000] + optim/total_grad_norm=9.308 + train/ActionL1Loss=0.0339 + throughput/total_tokens=1,090,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5681/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,090,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5682/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,090,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5683/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,091,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5684/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,091,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5685/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,091,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5686/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,091,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5687/500000] + train/ActionL1Loss=0.0678 + throughput/total_tokens=1,091,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5688/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,092,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5689/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,092,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5690/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=1,092,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5691/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,092,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5692/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,092,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5693/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,093,056,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5694/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,093,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5695/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=1,093,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5696/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,093,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5697/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,093,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5698/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=1,094,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5699/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,094,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5700/500000] + optim/total_grad_norm=8.567 + train/ActionL1Loss=0.0600 + throughput/total_tokens=1,094,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5701/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,094,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5702/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,094,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5703/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,094,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5704/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,095,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5705/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,095,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5706/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,095,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5707/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,095,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5708/500000] + train/ActionL1Loss=0.0280 + throughput/total_tokens=1,095,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5709/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,096,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5710/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,096,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5711/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,096,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5712/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,096,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5713/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,096,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5714/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,097,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5715/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=1,097,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5716/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=1,097,472,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5717/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=1,097,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5718/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=1,097,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5719/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,098,048,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5720/500000] + optim/total_grad_norm=8.211 + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,098,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5721/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,098,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5722/500000] + train/ActionL1Loss=0.0706 + throughput/total_tokens=1,098,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5723/500000] + train/ActionL1Loss=0.0638 + throughput/total_tokens=1,098,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5724/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,099,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5725/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,099,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5726/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,099,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5727/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,099,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5728/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,099,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5729/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,099,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5730/500000] + train/ActionL1Loss=0.0642 + throughput/total_tokens=1,100,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5731/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,100,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5732/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,100,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5733/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=1,100,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5734/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,100,928,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5735/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,101,120,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5736/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=1,101,312,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5737/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,101,504,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5738/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,101,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5739/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,101,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5740/500000] + optim/total_grad_norm=9.803 + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,102,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5741/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,102,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5742/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=1,102,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5743/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,102,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5744/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,102,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5745/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,103,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5746/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,103,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5747/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,103,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5748/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,103,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5749/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=1,103,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5750/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,104,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5751/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=1,104,192,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5752/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,104,384,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5753/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,104,576,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5754/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,104,768,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5755/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=1,104,960,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5756/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,105,152,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5757/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,105,344,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5758/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,105,536,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5759/500000] + train/ActionL1Loss=0.0558 + throughput/total_tokens=1,105,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5760/500000] + optim/total_grad_norm=5.617 + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,105,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5761/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,106,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5762/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,106,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5763/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,106,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5764/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,106,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5765/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,106,880,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5766/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,107,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5767/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,107,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5768/500000] + train/ActionL1Loss=0.0292 + throughput/total_tokens=1,107,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5769/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,107,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5770/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,107,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5771/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,108,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5772/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,108,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5773/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,108,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5774/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,108,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5775/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,108,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5776/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,108,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5777/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,109,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5778/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,109,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5779/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,109,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5780/500000] + optim/total_grad_norm=9.312 + train/ActionL1Loss=0.0587 + throughput/total_tokens=1,109,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5781/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,109,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5782/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,110,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5783/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=1,110,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5784/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=1,110,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5785/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,110,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5786/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,110,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5787/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,111,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5788/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=1,111,296,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5789/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,111,488,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5790/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,111,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5791/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,111,872,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5792/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=1,112,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5793/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,112,256,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5794/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=1,112,448,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5795/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,112,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5796/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,112,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5797/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,113,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5798/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,113,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5799/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,113,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5800/500000] + optim/total_grad_norm=8.962 + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,113,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5801/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,113,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5802/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,113,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5803/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,114,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5804/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,114,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5805/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,114,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5806/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,114,752,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5807/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,114,944,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5808/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,115,136,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5809/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,115,328,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=5810/500000] + train/ActionL1Loss=0.0290 + throughput/total_tokens=1,115,520,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=5811/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=1,115,712,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=5812/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,115,904,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=5813/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,116,096,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=5814/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,116,288,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=5815/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,116,480,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=5816/500000] + train/ActionL1Loss=0.0259 + throughput/total_tokens=1,116,672,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=5817/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,116,864,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=5818/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,117,056,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=5819/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,117,248,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=5820/500000] + optim/total_grad_norm=8.809 + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,117,440,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=5821/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,117,632,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5822/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,117,824,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5823/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,118,016,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5824/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,118,208,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5825/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=1,118,400,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5826/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=1,118,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5827/500000] + train/ActionL1Loss=0.0679 + throughput/total_tokens=1,118,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5828/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,118,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5829/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,119,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5830/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=1,119,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5831/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=1,119,552,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5832/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=1,119,744,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5833/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,119,936,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5834/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,120,128,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5835/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,120,320,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5836/500000] + train/ActionL1Loss=0.0322 + throughput/total_tokens=1,120,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5837/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,120,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5838/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,120,896,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5839/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,121,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5840/500000] + optim/total_grad_norm=9.084 + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,121,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5841/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,121,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5842/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=1,121,664,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5843/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,121,856,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5844/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,122,048,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5845/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,122,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5846/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,122,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5847/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=1,122,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5848/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=1,122,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5849/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,123,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5850/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,123,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=5851/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,123,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5852/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,123,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5853/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,123,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5854/500000] + train/ActionL1Loss=0.0297 + throughput/total_tokens=1,123,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5855/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,124,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5856/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,124,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5857/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,124,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5858/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,124,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5859/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,124,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5860/500000] + optim/total_grad_norm=8.412 + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,125,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5861/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,125,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5862/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,125,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5863/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,125,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5864/500000] + train/ActionL1Loss=0.0276 + throughput/total_tokens=1,125,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5865/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=1,126,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5866/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,126,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5867/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,126,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5868/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=1,126,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5869/500000] + train/ActionL1Loss=0.0695 + throughput/total_tokens=1,126,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5870/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,127,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5871/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,127,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5872/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,127,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5873/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,127,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5874/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,127,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5875/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,128,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5876/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,128,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5877/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=1,128,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5878/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,128,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5879/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,128,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5880/500000] + optim/total_grad_norm=8.807 + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,128,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5881/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,129,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5882/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,129,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5883/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=1,129,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=5884/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,129,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5885/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,129,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5886/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,130,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5887/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,130,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5888/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,130,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5889/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,130,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5890/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,130,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5891/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,131,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5892/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,131,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5893/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,131,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5894/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,131,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5895/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,131,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5896/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,132,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5897/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,132,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5898/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,132,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5899/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,132,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5900/500000] + optim/total_grad_norm=10.31 + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,132,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5901/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,132,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=5902/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,133,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5903/500000] + train/ActionL1Loss=0.0719 + throughput/total_tokens=1,133,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5904/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=1,133,568,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5905/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,133,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5906/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,133,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5907/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=1,134,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5908/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,134,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5909/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,134,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5910/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,134,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5911/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,134,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5912/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=1,135,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5913/500000] + train/ActionL1Loss=0.0289 + throughput/total_tokens=1,135,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5914/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=1,135,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=5915/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=1,135,680,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5916/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,135,872,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5917/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,136,064,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5918/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,136,256,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5919/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,136,448,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=5920/500000] + optim/total_grad_norm=8.496 + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,136,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5921/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,136,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5922/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,137,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5923/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,137,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5924/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,137,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5925/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=1,137,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5926/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,137,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5927/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,137,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5928/500000] + train/ActionL1Loss=0.0272 + throughput/total_tokens=1,138,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5929/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,138,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=5930/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=1,138,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=5931/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,138,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5932/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,138,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=5933/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,139,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5934/500000] + train/ActionL1Loss=0.0668 + throughput/total_tokens=1,139,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5935/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=1,139,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5936/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=1,139,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5937/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,139,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5938/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,140,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5939/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,140,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5940/500000] + optim/total_grad_norm=8.398 + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,140,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5941/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,140,672,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5942/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,140,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5943/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,141,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5944/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,141,248,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5945/500000] + train/ActionL1Loss=0.0713 + throughput/total_tokens=1,141,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5946/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,141,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5947/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=1,141,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5948/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=1,142,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5949/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,142,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=5950/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,142,400,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=5951/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=1,142,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5952/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,142,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=5953/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,142,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5954/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,143,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5955/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,143,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5956/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,143,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5957/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,143,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5958/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,143,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5959/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=1,144,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5960/500000] + optim/total_grad_norm=7.846 + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,144,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5961/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,144,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5962/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,144,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5963/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,144,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5964/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,145,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5965/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=1,145,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5966/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,145,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5967/500000] + train/ActionL1Loss=0.0683 + throughput/total_tokens=1,145,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5968/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,145,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5969/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,146,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=5970/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,146,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5971/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,146,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5972/500000] + train/ActionL1Loss=0.0751 + throughput/total_tokens=1,146,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5973/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=1,146,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5974/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,147,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5975/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,147,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5976/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,147,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5977/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,147,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5978/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,147,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5979/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,147,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5980/500000] + optim/total_grad_norm=8.723 + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,148,160,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5981/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,148,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5982/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,148,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5983/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,148,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5984/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,148,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5985/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,149,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5986/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,149,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5987/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,149,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5988/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,149,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5989/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,149,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5990/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,150,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=5991/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,150,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5992/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,150,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=5993/500000] + train/ActionL1Loss=0.0312 + throughput/total_tokens=1,150,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5994/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,150,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5995/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,151,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5996/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=1,151,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5997/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,151,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=5998/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=1,151,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=5999/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,151,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6000/500000] + optim/total_grad_norm=8.336 + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,152,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/13 [03:32:45] INFO | >> Saving config... checkpoint.py:608 +10/13 [03:33:17] INFO | >> Saving model state... checkpoint.py:796 +10/13 [03:34:28] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [03:36:01] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=6001/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,152,192,000 + throughput/device/tokens_per_second=1,210 + throughput/device/batches_per_second=0.0504 +[step=6002/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,152,384,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6003/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,152,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6004/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,152,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6005/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,152,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6006/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,153,152,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6007/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,153,344,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6008/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,153,536,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6009/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,153,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6010/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,153,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6011/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,154,112,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6012/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,154,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6013/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,154,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6014/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,154,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6015/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,154,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6016/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,155,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6017/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,155,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6018/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=1,155,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6019/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=1,155,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6020/500000] + optim/total_grad_norm=7.814 + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,155,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6021/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,156,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6022/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,156,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6023/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,156,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6024/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,156,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6025/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,156,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6026/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,156,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6027/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,157,184,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6028/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,157,376,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6029/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,157,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6030/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,157,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6031/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,157,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6032/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,158,144,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6033/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,158,336,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6034/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,158,528,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6035/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,158,720,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6036/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,158,912,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6037/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,159,104,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6038/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,159,296,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6039/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,159,488,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6040/500000] + optim/total_grad_norm=8.209 + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,159,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6041/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=1,159,872,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6042/500000] + train/ActionL1Loss=0.0267 + throughput/total_tokens=1,160,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6043/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,160,256,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6044/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,160,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6045/500000] + train/ActionL1Loss=0.0676 + throughput/total_tokens=1,160,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6046/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,160,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6047/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,161,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6048/500000] + train/ActionL1Loss=0.0716 + throughput/total_tokens=1,161,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6049/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=1,161,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6050/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,161,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6051/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,161,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6052/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,161,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6053/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=1,162,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6054/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,162,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6055/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,162,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6056/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,162,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6057/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=1,162,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6058/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,163,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6059/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,163,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6060/500000] + optim/total_grad_norm=9.939 + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,163,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6061/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,163,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6062/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,163,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6063/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,164,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6064/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,164,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6065/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,164,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6066/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=1,164,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6067/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,164,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6068/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,165,056,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6069/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,165,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6070/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=1,165,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6071/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,165,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6072/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,165,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6073/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=1,166,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6074/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,166,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6075/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,166,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6076/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=1,166,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6077/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,166,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6078/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,166,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6079/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,167,168,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6080/500000] + optim/total_grad_norm=8.365 + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,167,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6081/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,167,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6082/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=1,167,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6083/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,167,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6084/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,168,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6085/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=1,168,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6086/500000] + train/ActionL1Loss=0.0675 + throughput/total_tokens=1,168,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6087/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,168,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6088/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,168,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6089/500000] + train/ActionL1Loss=0.0642 + throughput/total_tokens=1,169,088,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6090/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=1,169,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6091/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,169,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6092/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,169,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6093/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,169,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6094/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,170,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6095/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,170,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6096/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,170,432,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6097/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=1,170,624,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6098/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,170,816,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6099/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,171,008,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6100/500000] + optim/total_grad_norm=8.191 + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,171,200,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6101/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,171,392,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6102/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,171,584,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6103/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,171,776,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6104/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,171,968,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6105/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=1,172,160,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6106/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,172,352,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6107/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,172,544,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6108/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=1,172,736,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6109/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,172,928,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6110/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=1,173,120,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=6111/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=1,173,312,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6112/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,173,504,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6113/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,173,696,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6114/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=1,173,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=6115/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,174,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6116/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,174,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6117/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,174,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6118/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,174,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6119/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,174,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6120/500000] + optim/total_grad_norm=8.524 + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,175,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6121/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=1,175,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6122/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,175,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6123/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,175,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6124/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,175,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6125/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=1,176,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6126/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,176,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6127/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,176,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6128/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,176,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6129/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,176,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6130/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,176,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6131/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,177,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6132/500000] + train/ActionL1Loss=0.0771 + throughput/total_tokens=1,177,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6133/500000] + train/ActionL1Loss=0.0642 + throughput/total_tokens=1,177,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6134/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,177,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6135/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,177,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6136/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,178,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6137/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,178,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6138/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,178,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6139/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=1,178,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6140/500000] + optim/total_grad_norm=7.852 + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,178,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6141/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,179,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6142/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,179,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6143/500000] + train/ActionL1Loss=0.0642 + throughput/total_tokens=1,179,456,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6144/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,179,648,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6145/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,179,840,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6146/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,180,032,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6147/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,180,224,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6148/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,180,416,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6149/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,180,608,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6150/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,180,800,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=6151/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,180,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6152/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,181,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6153/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,181,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6154/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,181,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6155/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,181,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6156/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,181,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6157/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,182,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6158/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,182,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6159/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=1,182,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6160/500000] + optim/total_grad_norm=9.110 + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,182,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6161/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=1,182,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6162/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,183,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6163/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,183,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6164/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,183,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6165/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,183,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6166/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,183,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6167/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,184,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6168/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,184,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6169/500000] + train/ActionL1Loss=0.0318 + throughput/total_tokens=1,184,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6170/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=1,184,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6171/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,184,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6172/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,185,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6173/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,185,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6174/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,185,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6175/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,185,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6176/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,185,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6177/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,185,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6178/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,186,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6179/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,186,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6180/500000] + optim/total_grad_norm=8.249 + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,186,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6181/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,186,752,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6182/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,186,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6183/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,187,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6184/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,187,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6185/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,187,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6186/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=1,187,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6187/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,187,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6188/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,188,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6189/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,188,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6190/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,188,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6191/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,188,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6192/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,188,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6193/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,189,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6194/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,189,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6195/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,189,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6196/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,189,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6197/500000] + train/ActionL1Loss=0.0645 + throughput/total_tokens=1,189,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6198/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,190,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6199/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=1,190,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6200/500000] + optim/total_grad_norm=9.229 + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,190,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6201/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,190,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6202/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,190,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6203/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,190,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6204/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,191,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6205/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,191,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6206/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,191,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6207/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,191,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6208/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,191,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6209/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=1,192,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6210/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,192,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6211/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,192,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6212/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,192,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6213/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=1,192,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6214/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,193,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6215/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,193,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6216/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,193,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6217/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,193,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6218/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=1,193,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6219/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,194,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6220/500000] + optim/total_grad_norm=9.036 + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,194,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6221/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=1,194,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6222/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,194,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6223/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,194,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6224/500000] + train/ActionL1Loss=0.0685 + throughput/total_tokens=1,195,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6225/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,195,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6226/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,195,392,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6227/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,195,584,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6228/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,195,776,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6229/500000] + train/ActionL1Loss=0.0301 + throughput/total_tokens=1,195,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6230/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=1,196,160,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6231/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,196,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6232/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,196,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6233/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,196,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6234/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,196,928,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6235/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,197,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6236/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=1,197,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6237/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,197,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6238/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,197,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6239/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,197,888,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6240/500000] + optim/total_grad_norm=8.995 + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,198,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6241/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,198,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6242/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,198,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6243/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,198,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6244/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,198,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6245/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,199,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6246/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,199,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6247/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,199,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6248/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,199,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6249/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,199,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6250/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,200,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6251/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,200,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6252/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,200,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6253/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,200,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6254/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=1,200,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6255/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,200,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6256/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,201,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6257/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,201,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6258/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,201,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6259/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,201,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6260/500000] + optim/total_grad_norm=8.919 + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,201,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6261/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,202,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6262/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=1,202,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6263/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,202,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6264/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=1,202,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6265/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,202,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6266/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,203,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6267/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=1,203,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6268/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,203,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6269/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,203,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6270/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,203,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6271/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,204,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6272/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,204,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6273/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,204,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6274/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,204,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6275/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,204,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6276/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,204,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6277/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,205,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6278/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,205,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6279/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,205,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6280/500000] + optim/total_grad_norm=7.810 + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,205,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6281/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,205,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6282/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,206,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6283/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,206,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6284/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,206,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6285/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,206,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6286/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=1,206,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6287/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,207,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6288/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,207,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6289/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=1,207,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6290/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=1,207,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6291/500000] + train/ActionL1Loss=0.0262 + throughput/total_tokens=1,207,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6292/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,208,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6293/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,208,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6294/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,208,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6295/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=1,208,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6296/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,208,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6297/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,209,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6298/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,209,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6299/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,209,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6300/500000] + optim/total_grad_norm=8.643 + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,209,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6301/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,209,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6302/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,209,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6303/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=1,210,176,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=6304/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=1,210,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6305/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,210,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6306/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,210,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6307/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,210,944,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6308/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,211,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6309/500000] + train/ActionL1Loss=0.0292 + throughput/total_tokens=1,211,328,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6310/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,211,520,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6311/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,211,712,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=6312/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,211,904,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6313/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,212,096,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6314/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,212,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6315/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,212,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6316/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,212,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6317/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,212,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6318/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,213,056,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6319/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,213,248,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6320/500000] + optim/total_grad_norm=7.273 + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,213,440,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6321/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=1,213,632,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6322/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,213,824,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6323/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,214,016,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6324/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,214,208,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6325/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,214,400,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6326/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,214,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6327/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=1,214,784,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6328/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,214,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6329/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,215,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6330/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,215,360,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6331/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,215,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6332/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,215,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6333/500000] + train/ActionL1Loss=0.0714 + throughput/total_tokens=1,215,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6334/500000] + train/ActionL1Loss=0.0676 + throughput/total_tokens=1,216,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6335/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=1,216,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6336/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,216,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6337/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=1,216,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6338/500000] + train/ActionL1Loss=0.0646 + throughput/total_tokens=1,216,896,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6339/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,217,088,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6340/500000] + optim/total_grad_norm=7.958 + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,217,280,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=6341/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,217,472,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6342/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,217,664,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6343/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,217,856,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6344/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,218,048,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6345/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,218,240,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6346/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,218,432,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6347/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=1,218,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6348/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,218,816,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6349/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,219,008,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6350/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,219,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6351/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,219,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6352/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=1,219,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6353/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,219,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6354/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,219,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6355/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,220,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6356/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,220,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6357/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=1,220,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6358/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,220,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6359/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,220,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6360/500000] + optim/total_grad_norm=8.154 + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,221,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6361/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,221,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6362/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,221,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6363/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,221,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6364/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,221,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6365/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,222,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6366/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,222,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6367/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,222,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6368/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,222,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6369/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,222,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6370/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,223,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6371/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,223,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6372/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=1,223,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6373/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,223,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6374/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,223,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6375/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,224,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6376/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,224,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6377/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,224,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6378/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,224,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6379/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,224,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6380/500000] + optim/total_grad_norm=8.726 + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,224,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6381/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,225,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6382/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,225,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6383/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,225,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6384/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=1,225,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6385/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,225,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6386/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,226,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6387/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,226,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6388/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,226,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6389/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=1,226,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6390/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,226,880,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6391/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,227,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6392/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,227,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6393/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=1,227,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6394/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,227,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6395/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,227,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6396/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,228,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6397/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,228,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6398/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,228,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6399/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,228,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6400/500000] + optim/total_grad_norm=9.174 + train/ActionL1Loss=0.0349 + throughput/total_tokens=1,228,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6401/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,228,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6402/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,229,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6403/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,229,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6404/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,229,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6405/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,229,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6406/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,229,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6407/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,230,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6408/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,230,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6409/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,230,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6410/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,230,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6411/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,230,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6412/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,231,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6413/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,231,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6414/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,231,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6415/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,231,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6416/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=1,231,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6417/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,232,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6418/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,232,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6419/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,232,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6420/500000] + optim/total_grad_norm=9.438 + train/ActionL1Loss=0.0646 + throughput/total_tokens=1,232,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6421/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,232,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6422/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,233,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6423/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,233,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6424/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,233,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6425/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,233,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6426/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,233,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6427/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,233,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6428/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,234,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6429/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,234,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6430/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,234,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6431/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,234,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6432/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,234,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6433/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=1,235,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6434/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,235,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6435/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,235,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6436/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,235,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6437/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,235,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6438/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,236,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6439/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,236,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6440/500000] + optim/total_grad_norm=7.659 + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,236,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6441/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,236,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6442/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,236,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6443/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,237,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6444/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,237,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6445/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,237,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6446/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,237,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6447/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,237,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6448/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,238,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6449/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,238,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6450/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,238,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6451/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,238,592,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6452/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,238,784,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6453/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=1,238,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6454/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,239,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6455/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,239,360,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6456/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=1,239,552,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6457/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,239,744,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6458/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,239,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6459/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,240,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6460/500000] + optim/total_grad_norm=8.608 + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,240,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=6461/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,240,512,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=6462/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,240,704,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6463/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,240,896,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6464/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,241,088,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6465/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,241,280,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6466/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,241,472,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6467/500000] + train/ActionL1Loss=0.0332 + throughput/total_tokens=1,241,664,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6468/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,241,856,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6469/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,242,048,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6470/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,242,240,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6471/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,242,432,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6472/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,242,624,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6473/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,242,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6474/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,243,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6475/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,243,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6476/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,243,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6477/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,243,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6478/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,243,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6479/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,243,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6480/500000] + optim/total_grad_norm=8.094 + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,244,160,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6481/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,244,352,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6482/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=1,244,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6483/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,244,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6484/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=1,244,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6485/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,245,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6486/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=1,245,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6487/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,245,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6488/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=1,245,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6489/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=1,245,888,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6490/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,246,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6491/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,246,272,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6492/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,246,464,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6493/500000] + train/ActionL1Loss=0.0264 + throughput/total_tokens=1,246,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6494/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,246,848,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6495/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,247,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6496/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,247,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6497/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,247,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6498/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,247,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6499/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=1,247,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6500/500000] + optim/total_grad_norm=8.892 + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,248,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +10/13 [06:27:11] INFO | >> Saving config... checkpoint.py:608 +10/13 [06:27:56] INFO | >> Saving model state... checkpoint.py:796 +10/13 [06:29:09] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [06:30:43] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=6501/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,248,192,000 + throughput/device/tokens_per_second=1,209 + throughput/device/batches_per_second=0.0504 +[step=6502/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,248,384,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0494 +[step=6503/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,248,576,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6504/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,248,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6505/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,248,960,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6506/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,249,152,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6507/500000] + train/ActionL1Loss=0.0696 + throughput/total_tokens=1,249,344,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6508/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=1,249,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6509/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,249,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6510/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,249,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6511/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,250,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6512/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,250,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6513/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,250,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6514/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,250,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6515/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,250,880,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6516/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,251,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6517/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=1,251,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6518/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,251,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6519/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,251,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6520/500000] + optim/total_grad_norm=8.225 + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,251,840,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6521/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,252,032,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6522/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,252,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6523/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,252,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6524/500000] + train/ActionL1Loss=0.0286 + throughput/total_tokens=1,252,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6525/500000] + train/ActionL1Loss=0.0197 + throughput/total_tokens=1,252,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6526/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,252,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6527/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,253,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6528/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,253,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6529/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,253,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6530/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,253,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6531/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,253,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6532/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,254,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6533/500000] + train/ActionL1Loss=0.0251 + throughput/total_tokens=1,254,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6534/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,254,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6535/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,254,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6536/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,254,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6537/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,255,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6538/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,255,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6539/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,255,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6540/500000] + optim/total_grad_norm=8.643 + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,255,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6541/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,255,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6542/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=1,256,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6543/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,256,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6544/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,256,448,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6545/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,256,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6546/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,256,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6547/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,257,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6548/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,257,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6549/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,257,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6550/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,257,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6551/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,257,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6552/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,257,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6553/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,258,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6554/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,258,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6555/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=1,258,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6556/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=1,258,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6557/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,258,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6558/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,259,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6559/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,259,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6560/500000] + optim/total_grad_norm=8.519 + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,259,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6561/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,259,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6562/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=1,259,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6563/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,260,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6564/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,260,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6565/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,260,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6566/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,260,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6567/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,260,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6568/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,261,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6569/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,261,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6570/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,261,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6571/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,261,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6572/500000] + train/ActionL1Loss=0.0295 + throughput/total_tokens=1,261,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6573/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,262,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6574/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,262,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6575/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,262,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6576/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=1,262,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6577/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=1,262,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6578/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,262,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6579/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=1,263,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6580/500000] + optim/total_grad_norm=8.912 + train/ActionL1Loss=0.0588 + throughput/total_tokens=1,263,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6581/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,263,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6582/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,263,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6583/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,263,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6584/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,264,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6585/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,264,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6586/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=1,264,512,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6587/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,264,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6588/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,264,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6589/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,265,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6590/500000] + train/ActionL1Loss=0.0327 + throughput/total_tokens=1,265,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6591/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=1,265,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6592/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,265,664,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6593/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,265,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6594/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=1,266,048,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6595/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,266,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6596/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,266,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6597/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,266,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6598/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,266,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6599/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=1,267,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6600/500000] + optim/total_grad_norm=8.813 + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,267,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6601/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,267,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6602/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,267,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6603/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,267,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6604/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,267,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6605/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,268,160,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6606/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,268,352,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6607/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,268,544,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6608/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,268,736,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=6609/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,268,928,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6610/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,269,120,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=6611/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,269,312,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6612/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,269,504,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6613/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,269,696,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6614/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,269,888,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6615/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,270,080,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6616/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,270,272,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6617/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=1,270,464,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6618/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,270,656,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6619/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,270,848,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6620/500000] + optim/total_grad_norm=8.915 + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,271,040,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6621/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,271,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6622/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,271,424,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6623/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,271,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6624/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,271,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6625/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,272,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6626/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,272,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6627/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=1,272,384,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6628/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,272,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6629/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,272,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6630/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,272,960,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6631/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,273,152,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6632/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,273,344,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6633/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,273,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6634/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,273,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6635/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,273,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6636/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,274,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6637/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,274,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6638/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,274,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6639/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,274,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6640/500000] + optim/total_grad_norm=7.670 + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,274,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6641/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,275,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6642/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,275,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6643/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,275,456,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6644/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,275,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6645/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,275,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6646/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,276,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6647/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,276,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6648/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,276,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6649/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=1,276,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6650/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,276,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6651/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=1,276,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6652/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,277,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6653/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,277,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6654/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,277,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6655/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=1,277,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6656/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,277,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6657/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,278,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6658/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,278,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6659/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,278,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6660/500000] + optim/total_grad_norm=8.292 + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,278,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6661/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=1,278,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6662/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,279,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6663/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,279,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6664/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,279,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6665/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,279,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6666/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=1,279,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6667/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,280,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6668/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,280,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6669/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,280,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6670/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,280,640,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6671/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,280,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6672/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,281,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6673/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=1,281,216,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6674/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=1,281,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6675/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,281,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6676/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,281,792,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6677/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,281,984,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6678/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,282,176,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6679/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,282,368,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6680/500000] + optim/total_grad_norm=7.640 + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,282,560,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6681/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=1,282,752,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6682/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,282,944,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6683/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,283,136,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6684/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,283,328,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=6685/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,283,520,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6686/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,283,712,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6687/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,283,904,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6688/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,284,096,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6689/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,284,288,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6690/500000] + train/ActionL1Loss=0.0323 + throughput/total_tokens=1,284,480,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6691/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,284,672,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6692/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,284,864,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6693/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,285,056,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6694/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,285,248,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6695/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,285,440,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6696/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,285,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6697/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,285,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=6698/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,286,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6699/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,286,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6700/500000] + optim/total_grad_norm=9.119 + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,286,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6701/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,286,592,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=6702/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=1,286,784,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=6703/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,286,976,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6704/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=1,287,168,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6705/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,287,360,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=6706/500000] + train/ActionL1Loss=0.0688 + throughput/total_tokens=1,287,552,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6707/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=1,287,744,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=6708/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,287,936,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6709/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,288,128,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6710/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,288,320,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=6711/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=1,288,512,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=6712/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,288,704,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6713/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,288,896,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6714/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,289,088,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6715/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,289,280,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=6716/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,289,472,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6717/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,289,664,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=6718/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,289,856,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6719/500000] + train/ActionL1Loss=0.0300 + throughput/total_tokens=1,290,048,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6720/500000] + optim/total_grad_norm=6.707 + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,290,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6721/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,290,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6722/500000] + train/ActionL1Loss=0.0299 + throughput/total_tokens=1,290,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6723/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=1,290,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6724/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,291,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6725/500000] + train/ActionL1Loss=0.0699 + throughput/total_tokens=1,291,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6726/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,291,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6727/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,291,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6728/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,291,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6729/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,291,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6730/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,292,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6731/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,292,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6732/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=1,292,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6733/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,292,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6734/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,292,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6735/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,293,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6736/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,293,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6737/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,293,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6738/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,293,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6739/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=1,293,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6740/500000] + optim/total_grad_norm=7.921 + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,294,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6741/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=1,294,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6742/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,294,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6743/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,294,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6744/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,294,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6745/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,295,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6746/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,295,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6747/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,295,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6748/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,295,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6749/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,295,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6750/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,296,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6751/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,296,192,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6752/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,296,384,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6753/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,296,576,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6754/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,296,768,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6755/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,296,960,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6756/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,297,152,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6757/500000] + train/ActionL1Loss=0.0274 + throughput/total_tokens=1,297,344,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6758/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,297,536,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=6759/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=1,297,728,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6760/500000] + optim/total_grad_norm=10.33 + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,297,920,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=6761/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,298,112,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6762/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=1,298,304,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6763/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=1,298,496,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6764/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,298,688,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6765/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=1,298,880,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6766/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,299,072,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6767/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,299,264,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6768/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,299,456,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6769/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,299,648,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6770/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,299,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6771/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,300,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6772/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,300,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6773/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,300,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6774/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=1,300,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6775/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,300,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6776/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,300,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6777/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,301,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6778/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=1,301,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6779/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,301,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6780/500000] + optim/total_grad_norm=9.647 + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,301,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6781/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,301,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6782/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,302,144,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6783/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,302,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6784/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,302,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6785/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,302,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6786/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,302,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6787/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,303,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6788/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,303,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6789/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,303,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6790/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,303,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6791/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,303,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6792/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,304,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6793/500000] + train/ActionL1Loss=0.0289 + throughput/total_tokens=1,304,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6794/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,304,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6795/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,304,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6796/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=1,304,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6797/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,305,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6798/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,305,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6799/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,305,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6800/500000] + optim/total_grad_norm=8.814 + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,305,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +wandb: WARNING A graphql request initiated by the public wandb API timed out (timeout=19 sec). Create a new API with an integer timeout larger than 19, e.g., `api = wandb.Api(timeout=29)` to increase the graphql timeout. +[step=6801/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,305,792,000 + throughput/device/tokens_per_second=1,119 + throughput/device/batches_per_second=0.0466 +[step=6802/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,305,984,000 + throughput/device/tokens_per_second=1,118 + throughput/device/batches_per_second=0.0466 +[step=6803/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=1,306,176,000 + throughput/device/tokens_per_second=1,118 + throughput/device/batches_per_second=0.0466 +[step=6804/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,306,368,000 + throughput/device/tokens_per_second=1,118 + throughput/device/batches_per_second=0.0466 +[step=6805/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,306,560,000 + throughput/device/tokens_per_second=1,118 + throughput/device/batches_per_second=0.0466 +[step=6806/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,306,752,000 + throughput/device/tokens_per_second=1,119 + throughput/device/batches_per_second=0.0466 +[step=6807/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,306,944,000 + throughput/device/tokens_per_second=1,120 + throughput/device/batches_per_second=0.0467 +[step=6808/500000] + train/ActionL1Loss=0.0624 + throughput/total_tokens=1,307,136,000 + throughput/device/tokens_per_second=1,121 + throughput/device/batches_per_second=0.0467 +[step=6809/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,307,328,000 + throughput/device/tokens_per_second=1,121 + throughput/device/batches_per_second=0.0467 +[step=6810/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,307,520,000 + throughput/device/tokens_per_second=1,120 + throughput/device/batches_per_second=0.0467 + System/Peak GPU Memory (MB)=46,924 +[step=6811/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,307,712,000 + throughput/device/tokens_per_second=1,121 + throughput/device/batches_per_second=0.0467 +[step=6812/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,307,904,000 + throughput/device/tokens_per_second=1,121 + throughput/device/batches_per_second=0.0467 +[step=6813/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,308,096,000 + throughput/device/tokens_per_second=1,121 + throughput/device/batches_per_second=0.0467 +[step=6814/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,308,288,000 + throughput/device/tokens_per_second=1,121 + throughput/device/batches_per_second=0.0467 +[step=6815/500000] + train/ActionL1Loss=0.0291 + throughput/total_tokens=1,308,480,000 + throughput/device/tokens_per_second=1,120 + throughput/device/batches_per_second=0.0467 +[step=6816/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,308,672,000 + throughput/device/tokens_per_second=1,120 + throughput/device/batches_per_second=0.0467 +[step=6817/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,308,864,000 + throughput/device/tokens_per_second=1,121 + throughput/device/batches_per_second=0.0467 +[step=6818/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,309,056,000 + throughput/device/tokens_per_second=1,121 + throughput/device/batches_per_second=0.0467 +[step=6819/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,309,248,000 + throughput/device/tokens_per_second=1,121 + throughput/device/batches_per_second=0.0467 +[step=6820/500000] + optim/total_grad_norm=6.654 + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,309,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6821/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=1,309,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6822/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,309,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6823/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=1,310,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6824/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,310,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6825/500000] + train/ActionL1Loss=0.0298 + throughput/total_tokens=1,310,400,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6826/500000] + train/ActionL1Loss=0.0279 + throughput/total_tokens=1,310,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6827/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,310,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6828/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,310,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6829/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,311,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6830/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,311,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6831/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,311,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6832/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,311,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6833/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,311,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6834/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,312,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6835/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,312,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6836/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,312,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6837/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,312,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6838/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,312,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6839/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,313,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6840/500000] + optim/total_grad_norm=8.506 + train/ActionL1Loss=0.0645 + throughput/total_tokens=1,313,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6841/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,313,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6842/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,313,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6843/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,313,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6844/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,314,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6845/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=1,314,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6846/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,314,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6847/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,314,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6848/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,314,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6849/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,315,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6850/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,315,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6851/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,315,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6852/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=1,315,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6853/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,315,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6854/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,315,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6855/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,316,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6856/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,316,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6857/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,316,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6858/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,316,736,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6859/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=1,316,928,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6860/500000] + optim/total_grad_norm=8.582 + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,317,120,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=6861/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=1,317,312,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6862/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,317,504,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6863/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,317,696,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6864/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,317,888,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6865/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,318,080,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6866/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,318,272,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6867/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,318,464,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6868/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,318,656,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=6869/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=1,318,848,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6870/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,319,040,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6871/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,319,232,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6872/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,319,424,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6873/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,319,616,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6874/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,319,808,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6875/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,320,000,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6876/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,320,192,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6877/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,320,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6878/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,320,576,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6879/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=1,320,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6880/500000] + optim/total_grad_norm=9.479 + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,320,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6881/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,321,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6882/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,321,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6883/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,321,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6884/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,321,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6885/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,321,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6886/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,322,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6887/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,322,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6888/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,322,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6889/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,322,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6890/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,322,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6891/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,323,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6892/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,323,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6893/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,323,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6894/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,323,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6895/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=1,323,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6896/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,324,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6897/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,324,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6898/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,324,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6899/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,324,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6900/500000] + optim/total_grad_norm=7.260 + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,324,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6901/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,324,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6902/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,325,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6903/500000] + train/ActionL1Loss=0.0322 + throughput/total_tokens=1,325,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6904/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,325,568,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6905/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,325,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6906/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,325,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6907/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,326,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6908/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,326,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6909/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,326,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6910/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,326,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6911/500000] + train/ActionL1Loss=0.0660 + throughput/total_tokens=1,326,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6912/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=1,327,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6913/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,327,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6914/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=1,327,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6915/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,327,680,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6916/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,327,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6917/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=1,328,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6918/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,328,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6919/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,328,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6920/500000] + optim/total_grad_norm=7.980 + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,328,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6921/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=1,328,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6922/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,329,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6923/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,329,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6924/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,329,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6925/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,329,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6926/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,329,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6927/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,329,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6928/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,330,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6929/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=1,330,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6930/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,330,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6931/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,330,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6932/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,330,944,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6933/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=1,331,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6934/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=1,331,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6935/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,331,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6936/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,331,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6937/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,331,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6938/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,332,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6939/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,332,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6940/500000] + optim/total_grad_norm=7.808 + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,332,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6941/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=1,332,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6942/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,332,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6943/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,333,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6944/500000] + train/ActionL1Loss=0.0677 + throughput/total_tokens=1,333,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6945/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,333,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6946/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,333,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6947/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,333,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6948/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,334,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6949/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,334,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=6950/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=1,334,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=6951/500000] + train/ActionL1Loss=0.0300 + throughput/total_tokens=1,334,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6952/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,334,784,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6953/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,334,976,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6954/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,335,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6955/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=1,335,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=6956/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,335,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=6957/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,335,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=6958/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=1,335,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=6959/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=1,336,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=6960/500000] + optim/total_grad_norm=7.541 + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,336,320,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=6961/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,336,512,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6962/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,336,704,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6963/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,336,896,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6964/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,337,088,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=6965/500000] + train/ActionL1Loss=0.0647 + throughput/total_tokens=1,337,280,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6966/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,337,472,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6967/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=1,337,664,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6968/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,337,856,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=6969/500000] + train/ActionL1Loss=0.0660 + throughput/total_tokens=1,338,048,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=6970/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=1,338,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6971/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,338,432,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6972/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=1,338,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6973/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,338,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6974/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=1,339,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6975/500000] + train/ActionL1Loss=0.0229 + throughput/total_tokens=1,339,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6976/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=1,339,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6977/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,339,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6978/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=1,339,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6979/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,339,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6980/500000] + optim/total_grad_norm=8.388 + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,340,160,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=6981/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,340,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6982/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,340,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6983/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,340,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=6984/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,340,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6985/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,341,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=6986/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,341,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6987/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=1,341,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=6988/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,341,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6989/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,341,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6990/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,342,080,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=6991/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=1,342,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6992/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,342,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6993/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,342,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=6994/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,342,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=6995/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,343,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6996/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,343,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6997/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,343,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6998/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,343,616,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=6999/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,343,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7000/500000] + optim/total_grad_norm=7.922 + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,344,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/13 [09:22:26] INFO | >> Saving config... checkpoint.py:608 +10/13 [09:22:58] INFO | >> Saving model state... checkpoint.py:796 +10/13 [09:24:09] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [09:25:41] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=7001/500000] + train/ActionL1Loss=0.0700 + throughput/total_tokens=1,344,192,000 + throughput/device/tokens_per_second=1,217 + throughput/device/batches_per_second=0.0507 +[step=7002/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=1,344,384,000 + throughput/device/tokens_per_second=1,194 + throughput/device/batches_per_second=0.0498 +[step=7003/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,344,576,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0494 +[step=7004/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=1,344,768,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=7005/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,344,960,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=7006/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,345,152,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=7007/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,345,344,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7008/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,345,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7009/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=1,345,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7010/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,345,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7011/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,346,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7012/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,346,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7013/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,346,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7014/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,346,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7015/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,346,880,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7016/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,347,072,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7017/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,347,264,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7018/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,347,456,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7019/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,347,648,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7020/500000] + optim/total_grad_norm=8.196 + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,347,840,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=7021/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,348,032,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7022/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,348,224,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7023/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,348,416,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7024/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,348,608,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7025/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,348,800,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7026/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,348,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7027/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,349,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7028/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=1,349,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7029/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,349,568,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7030/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,349,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7031/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,349,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7032/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,350,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7033/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,350,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7034/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=1,350,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7035/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,350,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7036/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,350,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7037/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,351,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7038/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=1,351,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7039/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=1,351,488,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7040/500000] + optim/total_grad_norm=7.885 + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,351,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7041/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,351,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7042/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,352,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7043/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,352,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7044/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,352,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7045/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,352,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7046/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,352,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7047/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,353,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7048/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=1,353,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7049/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,353,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7050/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,353,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7051/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=1,353,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7052/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,353,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7053/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,354,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7054/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,354,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7055/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,354,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7056/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,354,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7057/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,354,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7058/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=1,355,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7059/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,355,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7060/500000] + optim/total_grad_norm=8.317 + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,355,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7061/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,355,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7062/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,355,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7063/500000] + train/ActionL1Loss=0.0284 + throughput/total_tokens=1,356,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7064/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,356,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7065/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,356,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7066/500000] + train/ActionL1Loss=0.0297 + throughput/total_tokens=1,356,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7067/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,356,864,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7068/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,357,056,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7069/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,357,248,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7070/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,357,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7071/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,357,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7072/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,357,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7073/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,358,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7074/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,358,208,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7075/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,358,400,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7076/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,358,592,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7077/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,358,784,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7078/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=1,358,976,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7079/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,359,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7080/500000] + optim/total_grad_norm=10.09 + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,359,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7081/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,359,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7082/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,359,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7083/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=1,359,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7084/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=1,360,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7085/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=1,360,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7086/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,360,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7087/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,360,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7088/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=1,360,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7089/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,361,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7090/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,361,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7091/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,361,472,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7092/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=1,361,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7093/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,361,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7094/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,362,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7095/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,362,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7096/500000] + train/ActionL1Loss=0.0289 + throughput/total_tokens=1,362,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7097/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,362,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7098/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,362,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7099/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,363,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7100/500000] + optim/total_grad_norm=10.38 + train/ActionL1Loss=0.0629 + throughput/total_tokens=1,363,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7101/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,363,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7102/500000] + train/ActionL1Loss=0.0304 + throughput/total_tokens=1,363,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7103/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,363,776,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7104/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,363,968,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7105/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,364,160,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=7106/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,364,352,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=7107/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,364,544,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=7108/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,364,736,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=7109/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,364,928,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=7110/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,365,120,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=7111/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=1,365,312,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7112/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,365,504,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7113/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,365,696,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7114/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,365,888,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=7115/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=1,366,080,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7116/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,366,272,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7117/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,366,464,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7118/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,366,656,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7119/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,366,848,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7120/500000] + optim/total_grad_norm=9.359 + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,367,040,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7121/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=1,367,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7122/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,367,424,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7123/500000] + train/ActionL1Loss=0.0322 + throughput/total_tokens=1,367,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7124/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,367,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7125/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,368,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7126/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,368,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7127/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,368,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7128/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=1,368,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7129/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,368,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7130/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,368,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7131/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,369,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7132/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,369,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7133/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,369,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7134/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,369,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7135/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,369,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7136/500000] + train/ActionL1Loss=0.0327 + throughput/total_tokens=1,370,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7137/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,370,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7138/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,370,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7139/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,370,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7140/500000] + optim/total_grad_norm=9.205 + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,370,880,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7141/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,371,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7142/500000] + train/ActionL1Loss=0.0351 + throughput/total_tokens=1,371,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7143/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=1,371,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7144/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,371,648,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7145/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,371,840,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7146/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,372,032,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7147/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=1,372,224,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7148/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,372,416,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7149/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,372,608,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7150/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=1,372,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7151/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,372,992,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7152/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,373,184,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7153/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,373,376,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7154/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,373,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7155/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,373,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7156/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=1,373,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7157/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,374,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7158/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,374,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7159/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,374,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7160/500000] + optim/total_grad_norm=8.193 + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,374,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7161/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,374,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7162/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,375,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7163/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,375,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7164/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,375,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7165/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,375,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7166/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,375,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7167/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,376,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7168/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,376,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7169/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,376,448,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7170/500000] + train/ActionL1Loss=0.0307 + throughput/total_tokens=1,376,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7171/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,376,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7172/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,377,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7173/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,377,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7174/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,377,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7175/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,377,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7176/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=1,377,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7177/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=1,377,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7178/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=1,378,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7179/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,378,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7180/500000] + optim/total_grad_norm=8.086 + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,378,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7181/500000] + train/ActionL1Loss=0.0558 + throughput/total_tokens=1,378,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7182/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,378,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7183/500000] + train/ActionL1Loss=0.0319 + throughput/total_tokens=1,379,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7184/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,379,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7185/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,379,520,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7186/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,379,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7187/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,379,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7188/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,380,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7189/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,380,288,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7190/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,380,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7191/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,380,672,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7192/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,380,864,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7193/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,381,056,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7194/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,381,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7195/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,381,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7196/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,381,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7197/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,381,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7198/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,382,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7199/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,382,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7200/500000] + optim/total_grad_norm=9.788 + train/ActionL1Loss=0.0660 + throughput/total_tokens=1,382,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7201/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,382,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7202/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,382,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7203/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,382,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7204/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=1,383,168,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7205/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=1,383,360,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7206/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,383,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7207/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,383,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7208/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,383,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7209/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,384,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7210/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,384,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7211/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,384,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7212/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,384,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7213/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,384,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7214/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=1,385,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7215/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,385,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7216/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=1,385,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7217/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,385,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7218/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,385,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7219/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,386,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7220/500000] + optim/total_grad_norm=9.024 + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,386,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7221/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=1,386,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7222/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,386,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7223/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,386,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7224/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,387,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7225/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,387,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7226/500000] + train/ActionL1Loss=0.0286 + throughput/total_tokens=1,387,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7227/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,387,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7228/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,387,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7229/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,387,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7230/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,388,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7231/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,388,352,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7232/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,388,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7233/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,388,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7234/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,388,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7235/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,389,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7236/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,389,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7237/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=1,389,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7238/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,389,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7239/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,389,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7240/500000] + optim/total_grad_norm=10.57 + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,390,080,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7241/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,390,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7242/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,390,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7243/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,390,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7244/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,390,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7245/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,391,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7246/500000] + train/ActionL1Loss=0.0558 + throughput/total_tokens=1,391,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7247/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,391,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7248/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,391,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7249/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,391,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7250/500000] + train/ActionL1Loss=0.0766 + throughput/total_tokens=1,392,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7251/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,392,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7252/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,392,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7253/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,392,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7254/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,392,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7255/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,392,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7256/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,393,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7257/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,393,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7258/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,393,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7259/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,393,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7260/500000] + optim/total_grad_norm=7.131 + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,393,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7261/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,394,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7262/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,394,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7263/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,394,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7264/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,394,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7265/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=1,394,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7266/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=1,395,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7267/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,395,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7268/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,395,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7269/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,395,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7270/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,395,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7271/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,396,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7272/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,396,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7273/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,396,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7274/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,396,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7275/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,396,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7276/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,396,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7277/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,397,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7278/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,397,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7279/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,397,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7280/500000] + optim/total_grad_norm=9.731 + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,397,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7281/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,397,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7282/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,398,144,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7283/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,398,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7284/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,398,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7285/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,398,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7286/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,398,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7287/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,399,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7288/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,399,296,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7289/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,399,488,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7290/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,399,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7291/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,399,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7292/500000] + train/ActionL1Loss=0.0298 + throughput/total_tokens=1,400,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7293/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,400,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7294/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,400,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7295/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,400,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7296/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,400,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7297/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,401,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7298/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,401,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7299/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=1,401,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7300/500000] + optim/total_grad_norm=7.672 + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,401,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7301/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,401,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7302/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,401,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7303/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,402,176,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7304/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,402,368,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7305/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,402,560,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7306/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,402,752,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7307/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,402,944,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7308/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,403,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7309/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,403,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7310/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,403,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7311/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,403,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7312/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,403,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7313/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,404,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7314/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,404,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7315/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,404,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7316/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,404,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7317/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,404,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7318/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,405,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7319/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,405,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7320/500000] + optim/total_grad_norm=8.850 + train/ActionL1Loss=0.0562 + throughput/total_tokens=1,405,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7321/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,405,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7322/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,405,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7323/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,406,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7324/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,406,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7325/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,406,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7326/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,406,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7327/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,406,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7328/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,406,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7329/500000] + train/ActionL1Loss=0.0681 + throughput/total_tokens=1,407,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7330/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=1,407,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7331/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,407,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7332/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,407,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7333/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,407,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7334/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,408,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7335/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=1,408,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7336/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,408,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7337/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,408,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7338/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,408,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7339/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=1,409,088,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7340/500000] + optim/total_grad_norm=8.668 + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,409,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7341/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,409,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7342/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,409,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7343/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,409,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7344/500000] + train/ActionL1Loss=0.0351 + throughput/total_tokens=1,410,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7345/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,410,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7346/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,410,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7347/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,410,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7348/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,410,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7349/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,411,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7350/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,411,200,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7351/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,411,392,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7352/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,411,584,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7353/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,411,776,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7354/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,411,968,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7355/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,412,160,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7356/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,412,352,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7357/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,412,544,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7358/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,412,736,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7359/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,412,928,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7360/500000] + optim/total_grad_norm=8.549 + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,413,120,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=7361/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,413,312,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7362/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,413,504,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7363/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,413,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7364/500000] + train/ActionL1Loss=0.0295 + throughput/total_tokens=1,413,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7365/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,414,080,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7366/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=1,414,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7367/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,414,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7368/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,414,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7369/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=1,414,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7370/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,415,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7371/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,415,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7372/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=1,415,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7373/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,415,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7374/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,415,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7375/500000] + train/ActionL1Loss=0.0281 + throughput/total_tokens=1,416,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7376/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,416,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7377/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=1,416,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7378/500000] + train/ActionL1Loss=0.0690 + throughput/total_tokens=1,416,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7379/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,416,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7380/500000] + optim/total_grad_norm=8.694 + train/ActionL1Loss=0.0607 + throughput/total_tokens=1,416,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7381/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,417,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7382/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,417,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7383/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,417,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7384/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,417,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7385/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,417,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7386/500000] + train/ActionL1Loss=0.0310 + throughput/total_tokens=1,418,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7387/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,418,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7388/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,418,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7389/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,418,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7390/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,418,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7391/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=1,419,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7392/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,419,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7393/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,419,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7394/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=1,419,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7395/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=1,419,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7396/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,420,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7397/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,420,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7398/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,420,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7399/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,420,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7400/500000] + optim/total_grad_norm=8.439 + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,420,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7401/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,420,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7402/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,421,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7403/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,421,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7404/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,421,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7405/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,421,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7406/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=1,421,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7407/500000] + train/ActionL1Loss=0.0251 + throughput/total_tokens=1,422,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7408/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,422,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7409/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,422,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7410/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,422,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7411/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,422,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7412/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,423,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7413/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,423,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7414/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,423,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7415/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,423,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7416/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,423,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7417/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,424,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7418/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,424,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7419/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,424,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7420/500000] + optim/total_grad_norm=8.574 + train/ActionL1Loss=0.0334 + throughput/total_tokens=1,424,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7421/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,424,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7422/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=1,425,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7423/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,425,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7424/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,425,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7425/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=1,425,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7426/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,425,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7427/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,425,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7428/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,426,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7429/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,426,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7430/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,426,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7431/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,426,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7432/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,426,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7433/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,427,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7434/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,427,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7435/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=1,427,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7436/500000] + train/ActionL1Loss=0.0282 + throughput/total_tokens=1,427,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7437/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,427,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7438/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=1,428,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7439/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,428,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7440/500000] + optim/total_grad_norm=7.594 + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,428,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7441/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,428,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7442/500000] + train/ActionL1Loss=0.0283 + throughput/total_tokens=1,428,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7443/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,429,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7444/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,429,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7445/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,429,440,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7446/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,429,632,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7447/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,429,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7448/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,430,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7449/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,430,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7450/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,430,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7451/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,430,592,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7452/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,430,784,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7453/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,430,976,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7454/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,431,168,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7455/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,431,360,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7456/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,431,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7457/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,431,744,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7458/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,431,936,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7459/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,432,128,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7460/500000] + optim/total_grad_norm=7.931 + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,432,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=7461/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,432,512,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7462/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,432,704,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7463/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,432,896,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7464/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,433,088,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7465/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,433,280,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7466/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,433,472,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7467/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,433,664,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7468/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,433,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7469/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,434,048,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7470/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,434,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7471/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,434,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7472/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,434,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7473/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,434,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7474/500000] + train/ActionL1Loss=0.0345 + throughput/total_tokens=1,435,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7475/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,435,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7476/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,435,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7477/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,435,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7478/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,435,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7479/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,435,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7480/500000] + optim/total_grad_norm=8.845 + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,436,160,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7481/500000] + train/ActionL1Loss=0.0333 + throughput/total_tokens=1,436,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7482/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,436,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7483/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,436,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7484/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,436,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7485/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,437,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7486/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,437,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7487/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,437,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7488/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,437,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7489/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,437,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7490/500000] + train/ActionL1Loss=0.0312 + throughput/total_tokens=1,438,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7491/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,438,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7492/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=1,438,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7493/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,438,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7494/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,438,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7495/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,439,040,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7496/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,439,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7497/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,439,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7498/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,439,616,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7499/500000] + train/ActionL1Loss=0.0225 + throughput/total_tokens=1,439,808,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7500/500000] + optim/total_grad_norm=9.019 + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,440,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/13 [12:16:58] INFO | >> Saving config... checkpoint.py:608 +10/13 [12:17:29] INFO | >> Saving model state... checkpoint.py:796 +10/13 [12:18:41] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [12:20:12] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=7501/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,440,192,000 + throughput/device/tokens_per_second=1,214 + throughput/device/batches_per_second=0.0506 +[step=7502/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,440,384,000 + throughput/device/tokens_per_second=1,195 + throughput/device/batches_per_second=0.0498 +[step=7503/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,440,576,000 + throughput/device/tokens_per_second=1,190 + throughput/device/batches_per_second=0.0496 +[step=7504/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,440,768,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0494 +[step=7505/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,440,960,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0494 +[step=7506/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,441,152,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0493 +[step=7507/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,441,344,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0493 +[step=7508/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,441,536,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=7509/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,441,728,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=7510/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,441,920,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=7511/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,442,112,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=7512/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,442,304,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=7513/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,442,496,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=7514/500000] + train/ActionL1Loss=0.0660 + throughput/total_tokens=1,442,688,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=7515/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,442,880,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=7516/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,443,072,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=7517/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,443,264,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7518/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,443,456,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7519/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=1,443,648,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7520/500000] + optim/total_grad_norm=8.878 + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,443,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7521/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,444,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7522/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,444,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7523/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,444,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7524/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,444,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7525/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,444,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7526/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,444,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7527/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,445,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7528/500000] + train/ActionL1Loss=0.0293 + throughput/total_tokens=1,445,376,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7529/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,445,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7530/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,445,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7531/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,445,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7532/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=1,446,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7533/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,446,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7534/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=1,446,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7535/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,446,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7536/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,446,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7537/500000] + train/ActionL1Loss=0.0307 + throughput/total_tokens=1,447,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7538/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=1,447,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7539/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,447,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7540/500000] + optim/total_grad_norm=7.183 + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,447,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7541/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,447,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7542/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=1,448,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7543/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,448,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7544/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=1,448,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7545/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,448,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7546/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,448,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7547/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,449,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7548/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,449,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7549/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=1,449,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7550/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,449,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7551/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,449,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7552/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,449,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7553/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,450,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7554/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,450,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7555/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,450,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7556/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,450,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7557/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,450,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7558/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,451,136,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7559/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=1,451,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7560/500000] + optim/total_grad_norm=7.855 + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,451,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7561/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,451,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7562/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=1,451,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7563/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=1,452,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7564/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,452,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7565/500000] + train/ActionL1Loss=0.0327 + throughput/total_tokens=1,452,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7566/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,452,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7567/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,452,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7568/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,453,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7569/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,453,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7570/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,453,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7571/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=1,453,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7572/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,453,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7573/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,454,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7574/500000] + train/ActionL1Loss=0.0269 + throughput/total_tokens=1,454,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7575/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,454,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7576/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=1,454,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7577/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,454,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7578/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,454,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7579/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,455,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7580/500000] + optim/total_grad_norm=6.877 + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,455,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7581/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,455,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7582/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,455,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7583/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,455,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7584/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,456,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7585/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,456,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7586/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,456,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7587/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,456,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7588/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,456,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7589/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,457,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7590/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,457,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7591/500000] + train/ActionL1Loss=0.0631 + throughput/total_tokens=1,457,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7592/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=1,457,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7593/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,457,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7594/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,458,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7595/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,458,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7596/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,458,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7597/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,458,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7598/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,458,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7599/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,459,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7600/500000] + optim/total_grad_norm=6.768 + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,459,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7601/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=1,459,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7602/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,459,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7603/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,459,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7604/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,459,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7605/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=1,460,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7606/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,460,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7607/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,460,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7608/500000] + train/ActionL1Loss=0.0345 + throughput/total_tokens=1,460,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7609/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,460,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7610/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,461,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7611/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,461,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7612/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,461,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7613/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,461,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7614/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,461,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7615/500000] + train/ActionL1Loss=0.0662 + throughput/total_tokens=1,462,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7616/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,462,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7617/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=1,462,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7618/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,462,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7619/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,462,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7620/500000] + optim/total_grad_norm=7.395 + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,463,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7621/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=1,463,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7622/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=1,463,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7623/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=1,463,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7624/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,463,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7625/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,464,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7626/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,464,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7627/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,464,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7628/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,464,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7629/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,464,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7630/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,464,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7631/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,465,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7632/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,465,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7633/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,465,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7634/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,465,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7635/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,465,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7636/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,466,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7637/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,466,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7638/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,466,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7639/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,466,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7640/500000] + optim/total_grad_norm=9.811 + train/ActionL1Loss=0.0622 + throughput/total_tokens=1,466,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7641/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,467,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7642/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,467,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7643/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,467,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7644/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,467,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7645/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,467,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7646/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,468,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7647/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,468,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7648/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,468,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7649/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,468,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7650/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,468,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7651/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,468,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7652/500000] + train/ActionL1Loss=0.0305 + throughput/total_tokens=1,469,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7653/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,469,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7654/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,469,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7655/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,469,760,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7656/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,469,952,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7657/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=1,470,144,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7658/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,470,336,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7659/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,470,528,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7660/500000] + optim/total_grad_norm=5.717 + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,470,720,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=7661/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,470,912,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7662/500000] + train/ActionL1Loss=0.0297 + throughput/total_tokens=1,471,104,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7663/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,471,296,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7664/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=1,471,488,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7665/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,471,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7666/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,471,872,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7667/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=1,472,064,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7668/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,472,256,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7669/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,472,448,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7670/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=1,472,640,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7671/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=1,472,832,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7672/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,473,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7673/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,473,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7674/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,473,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7675/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,473,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7676/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,473,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7677/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,473,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7678/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,474,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7679/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=1,474,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7680/500000] + optim/total_grad_norm=8.905 + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,474,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7681/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,474,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7682/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,474,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7683/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,475,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7684/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,475,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7685/500000] + train/ActionL1Loss=0.0307 + throughput/total_tokens=1,475,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7686/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,475,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7687/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=1,475,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7688/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,476,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7689/500000] + train/ActionL1Loss=0.0323 + throughput/total_tokens=1,476,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7690/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,476,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7691/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,476,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7692/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,476,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7693/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,477,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7694/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,477,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7695/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,477,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7696/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,477,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7697/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,477,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7698/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,478,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7699/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,478,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7700/500000] + optim/total_grad_norm=8.011 + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,478,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7701/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,478,592,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7702/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=1,478,784,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7703/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,478,976,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7704/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,479,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7705/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,479,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7706/500000] + train/ActionL1Loss=0.0710 + throughput/total_tokens=1,479,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7707/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,479,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7708/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,479,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7709/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,480,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7710/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,480,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7711/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=1,480,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7712/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,480,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7713/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,480,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7714/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,481,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7715/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,481,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7716/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,481,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7717/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,481,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7718/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,481,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7719/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,482,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7720/500000] + optim/total_grad_norm=9.160 + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,482,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7721/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,482,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7722/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=1,482,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7723/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,482,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7724/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,483,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7725/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,483,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7726/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,483,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7727/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,483,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7728/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,483,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7729/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,483,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7730/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,484,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7731/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,484,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7732/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,484,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7733/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,484,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7734/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,484,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7735/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,485,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7736/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,485,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7737/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,485,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7738/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,485,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7739/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=1,485,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7740/500000] + optim/total_grad_norm=8.354 + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,486,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7741/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,486,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7742/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,486,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7743/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,486,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7744/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,486,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7745/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,487,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7746/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,487,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7747/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=1,487,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7748/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,487,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7749/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,487,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7750/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,488,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7751/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=1,488,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7752/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,488,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7753/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,488,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7754/500000] + train/ActionL1Loss=0.0282 + throughput/total_tokens=1,488,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7755/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,488,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7756/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,489,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7757/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,489,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7758/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=1,489,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7759/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,489,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7760/500000] + optim/total_grad_norm=8.198 + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,489,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7761/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,490,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7762/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,490,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7763/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,490,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7764/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,490,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7765/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,490,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7766/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,491,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7767/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,491,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7768/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,491,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7769/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,491,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7770/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,491,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7771/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,492,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7772/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,492,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7773/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,492,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7774/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,492,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7775/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,492,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7776/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=1,492,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7777/500000] + train/ActionL1Loss=0.0297 + throughput/total_tokens=1,493,184,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7778/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=1,493,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7779/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,493,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7780/500000] + optim/total_grad_norm=8.720 + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,493,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7781/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,493,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7782/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,494,144,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7783/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,494,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7784/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=1,494,528,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7785/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,494,720,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7786/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=1,494,912,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7787/500000] + train/ActionL1Loss=0.0667 + throughput/total_tokens=1,495,104,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7788/500000] + train/ActionL1Loss=0.0735 + throughput/total_tokens=1,495,296,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=7789/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,495,488,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7790/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=1,495,680,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=7791/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,495,872,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=7792/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,496,064,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7793/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,496,256,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7794/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,496,448,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=7795/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=1,496,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7796/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,496,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7797/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,497,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7798/500000] + train/ActionL1Loss=0.0312 + throughput/total_tokens=1,497,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7799/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,497,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7800/500000] + optim/total_grad_norm=9.213 + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,497,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7801/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,497,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7802/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,497,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7803/500000] + train/ActionL1Loss=0.0310 + throughput/total_tokens=1,498,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7804/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=1,498,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7805/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,498,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7806/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,498,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7807/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,498,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7808/500000] + train/ActionL1Loss=0.0236 + throughput/total_tokens=1,499,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7809/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,499,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7810/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,499,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7811/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,499,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7812/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,499,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7813/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,500,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7814/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,500,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7815/500000] + train/ActionL1Loss=0.0322 + throughput/total_tokens=1,500,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7816/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,500,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7817/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,500,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7818/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,501,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7819/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,501,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7820/500000] + optim/total_grad_norm=8.863 + train/ActionL1Loss=0.0598 + throughput/total_tokens=1,501,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7821/500000] + train/ActionL1Loss=0.0303 + throughput/total_tokens=1,501,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7822/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,501,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7823/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,502,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7824/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,502,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7825/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=1,502,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7826/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,502,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7827/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,502,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7828/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,502,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7829/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,503,168,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7830/500000] + train/ActionL1Loss=0.0621 + throughput/total_tokens=1,503,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7831/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,503,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7832/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,503,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7833/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,503,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7834/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,504,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7835/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,504,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7836/500000] + train/ActionL1Loss=0.0260 + throughput/total_tokens=1,504,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7837/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,504,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7838/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,504,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7839/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,505,088,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7840/500000] + optim/total_grad_norm=7.854 + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,505,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7841/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,505,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7842/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,505,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7843/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=1,505,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7844/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=1,506,048,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7845/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,506,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7846/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,506,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7847/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=1,506,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7848/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,506,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7849/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,507,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7850/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=1,507,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7851/500000] + train/ActionL1Loss=0.0323 + throughput/total_tokens=1,507,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7852/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,507,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7853/500000] + train/ActionL1Loss=0.0188 + throughput/total_tokens=1,507,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7854/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=1,507,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7855/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,508,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7856/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=1,508,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7857/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=1,508,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7858/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,508,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7859/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=1,508,928,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7860/500000] + optim/total_grad_norm=8.752 + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,509,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7861/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=1,509,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7862/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,509,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7863/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,509,696,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7864/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,509,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7865/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,510,080,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7866/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,510,272,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7867/500000] + train/ActionL1Loss=0.0264 + throughput/total_tokens=1,510,464,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7868/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,510,656,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7869/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,510,848,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7870/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,511,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7871/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,511,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7872/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=1,511,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7873/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=1,511,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7874/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,511,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7875/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,512,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7876/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,512,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7877/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,512,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7878/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,512,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7879/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,512,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7880/500000] + optim/total_grad_norm=7.555 + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,512,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7881/500000] + train/ActionL1Loss=0.0277 + throughput/total_tokens=1,513,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7882/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,513,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7883/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,513,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7884/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=1,513,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7885/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,513,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7886/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,514,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7887/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=1,514,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=7888/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=1,514,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7889/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,514,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7890/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,514,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7891/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,515,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7892/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,515,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7893/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=1,515,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7894/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=1,515,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7895/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=1,515,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7896/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,516,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7897/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=1,516,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7898/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,516,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7899/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,516,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7900/500000] + optim/total_grad_norm=8.546 + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,516,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=7901/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,516,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7902/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,517,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7903/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,517,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7904/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,517,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7905/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,517,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7906/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,517,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7907/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,518,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7908/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,518,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7909/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,518,528,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7910/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,518,720,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=7911/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,518,912,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7912/500000] + train/ActionL1Loss=0.0351 + throughput/total_tokens=1,519,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7913/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,519,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7914/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,519,488,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7915/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,519,680,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7916/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,519,872,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7917/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,520,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7918/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,520,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7919/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,520,448,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7920/500000] + optim/total_grad_norm=8.852 + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,520,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7921/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,520,832,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7922/500000] + train/ActionL1Loss=0.0191 + throughput/total_tokens=1,521,024,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7923/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,521,216,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7924/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,521,408,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7925/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,521,600,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7926/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,521,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7927/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,521,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7928/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,522,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7929/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,522,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7930/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,522,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7931/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,522,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7932/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,522,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7933/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,523,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7934/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,523,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7935/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,523,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7936/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,523,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7937/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,523,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7938/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,524,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7939/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,524,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7940/500000] + optim/total_grad_norm=8.501 + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,524,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7941/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,524,672,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7942/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,524,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7943/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=1,525,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7944/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,525,248,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7945/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,525,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7946/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,525,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7947/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,525,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7948/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,526,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7949/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,526,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7950/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,526,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7951/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,526,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=7952/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,526,784,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=7953/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,526,976,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7954/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,527,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7955/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,527,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7956/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=1,527,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7957/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,527,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7958/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,527,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7959/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,528,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7960/500000] + optim/total_grad_norm=8.610 + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,528,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7961/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,528,512,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7962/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,528,704,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=7963/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,528,896,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7964/500000] + train/ActionL1Loss=0.0205 + throughput/total_tokens=1,529,088,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=7965/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,529,280,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7966/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,529,472,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7967/500000] + train/ActionL1Loss=0.0264 + throughput/total_tokens=1,529,664,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7968/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,529,856,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7969/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,530,048,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=7970/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,530,240,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=7971/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,530,432,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7972/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,530,624,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7973/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,530,816,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7974/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,531,008,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7975/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,531,200,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=7976/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,531,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7977/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,531,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7978/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,531,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=7979/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,531,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7980/500000] + optim/total_grad_norm=8.026 + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,532,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7981/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,532,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=7982/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,532,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7983/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,532,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7984/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,532,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7985/500000] + train/ActionL1Loss=0.0301 + throughput/total_tokens=1,533,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7986/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,533,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7987/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=1,533,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7988/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,533,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7989/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,533,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7990/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,534,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=7991/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,534,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=7992/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,534,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7993/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,534,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7994/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,534,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=7995/500000] + train/ActionL1Loss=0.0279 + throughput/total_tokens=1,535,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7996/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,535,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7997/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,535,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7998/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,535,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=7999/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=1,535,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8000/500000] + optim/total_grad_norm=8.380 + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,536,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/13 [15:11:30] INFO | >> Saving config... checkpoint.py:608 +10/13 [15:12:02] INFO | >> Saving model state... checkpoint.py:796 +10/13 [15:13:09] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [15:14:41] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=8001/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,536,192,000 + throughput/device/tokens_per_second=1,211 + throughput/device/batches_per_second=0.0505 +[step=8002/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,536,384,000 + throughput/device/tokens_per_second=1,190 + throughput/device/batches_per_second=0.0496 +[step=8003/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,536,576,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=8004/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,536,768,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8005/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,536,960,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8006/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,537,152,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8007/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,537,344,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8008/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,537,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8009/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=1,537,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8010/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,537,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8011/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,538,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8012/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,538,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8013/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,538,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8014/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,538,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8015/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,538,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8016/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,539,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8017/500000] + train/ActionL1Loss=0.0276 + throughput/total_tokens=1,539,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8018/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,539,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8019/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,539,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8020/500000] + optim/total_grad_norm=6.827 + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,539,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8021/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,540,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8022/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=1,540,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8023/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,540,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8024/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,540,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8025/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,540,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8026/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,540,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8027/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,541,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8028/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,541,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8029/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,541,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8030/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,541,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8031/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,541,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8032/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,542,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8033/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,542,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8034/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,542,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8035/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,542,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8036/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,542,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8037/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,543,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8038/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,543,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8039/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,543,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8040/500000] + optim/total_grad_norm=8.776 + train/ActionL1Loss=0.0594 + throughput/total_tokens=1,543,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8041/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,543,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8042/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,544,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8043/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,544,256,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8044/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,544,448,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8045/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,544,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8046/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,544,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8047/500000] + train/ActionL1Loss=0.0648 + throughput/total_tokens=1,545,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8048/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,545,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8049/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=1,545,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8050/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,545,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8051/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,545,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8052/500000] + train/ActionL1Loss=0.0284 + throughput/total_tokens=1,545,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8053/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,546,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8054/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,546,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8055/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,546,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8056/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,546,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8057/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,546,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8058/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,547,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8059/500000] + train/ActionL1Loss=0.0231 + throughput/total_tokens=1,547,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8060/500000] + optim/total_grad_norm=9.675 + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,547,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8061/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,547,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8062/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,547,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8063/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,548,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8064/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=1,548,288,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8065/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,548,480,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8066/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,548,672,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8067/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=1,548,864,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8068/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,549,056,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8069/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=1,549,248,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8070/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,549,440,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8071/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,549,632,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8072/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,549,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8073/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,550,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8074/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,550,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8075/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,550,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8076/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,550,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8077/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,550,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8078/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,550,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8079/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,551,168,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8080/500000] + optim/total_grad_norm=9.664 + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,551,360,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8081/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,551,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8082/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,551,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8083/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,551,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8084/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,552,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8085/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=1,552,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8086/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,552,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8087/500000] + train/ActionL1Loss=0.0240 + throughput/total_tokens=1,552,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8088/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,552,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8089/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,553,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8090/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,553,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8091/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,553,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8092/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,553,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8093/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,553,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8094/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=1,554,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8095/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,554,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8096/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,554,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8097/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,554,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8098/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,554,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8099/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,555,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8100/500000] + optim/total_grad_norm=7.880 + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,555,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8101/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,555,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8102/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,555,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8103/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,555,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8104/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,555,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8105/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,556,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8106/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,556,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8107/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,556,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8108/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,556,736,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8109/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=1,556,928,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8110/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,557,120,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8111/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=1,557,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8112/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,557,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8113/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,557,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8114/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,557,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8115/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,558,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8116/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,558,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8117/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,558,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8118/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,558,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8119/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,558,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8120/500000] + optim/total_grad_norm=7.383 + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,559,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8121/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,559,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8122/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,559,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8123/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,559,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8124/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,559,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8125/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,560,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8126/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,560,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8127/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,560,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8128/500000] + train/ActionL1Loss=0.0281 + throughput/total_tokens=1,560,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8129/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,560,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8130/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,560,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8131/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,561,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8132/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,561,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8133/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,561,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8134/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,561,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8135/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,561,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8136/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,562,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8137/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=1,562,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8138/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,562,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8139/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,562,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8140/500000] + optim/total_grad_norm=8.985 + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,562,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8141/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,563,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8142/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,563,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8143/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,563,456,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8144/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,563,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8145/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=1,563,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8146/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,564,032,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8147/500000] + train/ActionL1Loss=0.0266 + throughput/total_tokens=1,564,224,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8148/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=1,564,416,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8149/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,564,608,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8150/500000] + train/ActionL1Loss=0.0247 + throughput/total_tokens=1,564,800,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8151/500000] + train/ActionL1Loss=0.0305 + throughput/total_tokens=1,564,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8152/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,565,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8153/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,565,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8154/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,565,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8155/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,565,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8156/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,565,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8157/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,566,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8158/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,566,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8159/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,566,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8160/500000] + optim/total_grad_norm=8.666 + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,566,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8161/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,566,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8162/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,567,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8163/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,567,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8164/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,567,488,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8165/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,567,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8166/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,567,872,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8167/500000] + train/ActionL1Loss=0.0693 + throughput/total_tokens=1,568,064,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=8168/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,568,256,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8169/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,568,448,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8170/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,568,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8171/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,568,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8172/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,569,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8173/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,569,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8174/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,569,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8175/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,569,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8176/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,569,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8177/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,569,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8178/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,570,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8179/500000] + train/ActionL1Loss=0.0329 + throughput/total_tokens=1,570,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8180/500000] + optim/total_grad_norm=8.532 + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,570,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8181/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,570,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8182/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,570,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8183/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,571,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8184/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,571,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8185/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,571,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8186/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,571,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8187/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,571,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8188/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,572,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8189/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,572,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8190/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,572,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8191/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,572,672,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8192/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,572,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8193/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,573,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8194/500000] + train/ActionL1Loss=0.0351 + throughput/total_tokens=1,573,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8195/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,573,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8196/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,573,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8197/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,573,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8198/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,574,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8199/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,574,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8200/500000] + optim/total_grad_norm=8.888 + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,574,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8201/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,574,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8202/500000] + train/ActionL1Loss=0.0272 + throughput/total_tokens=1,574,784,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8203/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,574,976,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8204/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,575,168,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8205/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,575,360,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8206/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,575,552,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8207/500000] + train/ActionL1Loss=0.0242 + throughput/total_tokens=1,575,744,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8208/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,575,936,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8209/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,576,128,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8210/500000] + train/ActionL1Loss=0.0295 + throughput/total_tokens=1,576,320,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=8211/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,576,512,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8212/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,576,704,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8213/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,576,896,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8214/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,577,088,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8215/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,577,280,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8216/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,577,472,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8217/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,577,664,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8218/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,577,856,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8219/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,578,048,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8220/500000] + optim/total_grad_norm=8.796 + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,578,240,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8221/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,578,432,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8222/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,578,624,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8223/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,578,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8224/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,579,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8225/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=1,579,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8226/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,579,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8227/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,579,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8228/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,579,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8229/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,579,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8230/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,580,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8231/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,580,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8232/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,580,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8233/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,580,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8234/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,580,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8235/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,581,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8236/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,581,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8237/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,581,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8238/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,581,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8239/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,581,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8240/500000] + optim/total_grad_norm=7.516 + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,582,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8241/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,582,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8242/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,582,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8243/500000] + train/ActionL1Loss=0.0233 + throughput/total_tokens=1,582,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8244/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,582,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8245/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,583,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8246/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,583,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8247/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,583,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8248/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,583,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8249/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,583,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8250/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,584,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8251/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,584,192,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8252/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,584,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8253/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,584,576,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8254/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,584,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8255/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=1,584,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8256/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=1,585,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8257/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=1,585,344,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8258/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,585,536,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8259/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,585,728,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8260/500000] + optim/total_grad_norm=7.473 + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,585,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8261/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,586,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8262/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,586,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8263/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,586,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8264/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,586,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8265/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,586,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8266/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=1,587,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8267/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=1,587,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8268/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,587,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8269/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,587,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8270/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,587,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8271/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,588,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8272/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,588,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8273/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,588,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8274/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,588,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8275/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,588,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8276/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=1,588,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8277/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,589,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8278/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,589,376,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8279/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,589,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8280/500000] + optim/total_grad_norm=10.74 + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,589,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8281/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,589,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8282/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,590,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8283/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,590,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8284/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,590,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8285/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,590,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8286/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,590,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8287/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,591,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8288/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,591,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8289/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,591,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8290/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,591,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8291/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,591,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8292/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=1,592,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8293/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,592,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8294/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,592,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8295/500000] + train/ActionL1Loss=0.0659 + throughput/total_tokens=1,592,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8296/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,592,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8297/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,593,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8298/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=1,593,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8299/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,593,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8300/500000] + optim/total_grad_norm=8.732 + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,593,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8301/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,593,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8302/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,593,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8303/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,594,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8304/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,594,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8305/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,594,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8306/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=1,594,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8307/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,594,944,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8308/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=1,595,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8309/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,595,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8310/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,595,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8311/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,595,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8312/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,595,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8313/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,596,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8314/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,596,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8315/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,596,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8316/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,596,672,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=8317/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,596,864,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8318/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,597,056,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8319/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,597,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8320/500000] + optim/total_grad_norm=7.695 + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,597,440,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8321/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,597,632,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8322/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,597,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8323/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,598,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8324/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,598,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8325/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,598,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8326/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,598,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8327/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,598,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8328/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=1,598,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8329/500000] + train/ActionL1Loss=0.0628 + throughput/total_tokens=1,599,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8330/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=1,599,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8331/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,599,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8332/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=1,599,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8333/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,599,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8334/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,600,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8335/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,600,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8336/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,600,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8337/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,600,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8338/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,600,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8339/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,601,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8340/500000] + optim/total_grad_norm=7.811 + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,601,280,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8341/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,601,472,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8342/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,601,664,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8343/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,601,856,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8344/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,602,048,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8345/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,602,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8346/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,602,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8347/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=1,602,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8348/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,602,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8349/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,603,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8350/500000] + train/ActionL1Loss=0.0300 + throughput/total_tokens=1,603,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8351/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=1,603,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8352/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,603,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8353/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,603,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8354/500000] + train/ActionL1Loss=0.0715 + throughput/total_tokens=1,603,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8355/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,604,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8356/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,604,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8357/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,604,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8358/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,604,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8359/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,604,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8360/500000] + optim/total_grad_norm=6.203 + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,605,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8361/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,605,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8362/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,605,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8363/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,605,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8364/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=1,605,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8365/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,606,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8366/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,606,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8367/500000] + train/ActionL1Loss=0.0593 + throughput/total_tokens=1,606,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8368/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,606,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8369/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,606,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8370/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,607,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8371/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,607,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8372/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,607,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8373/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,607,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8374/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,607,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8375/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,608,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8376/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,608,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8377/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,608,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8378/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=1,608,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8379/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,608,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8380/500000] + optim/total_grad_norm=9.058 + train/ActionL1Loss=0.0581 + throughput/total_tokens=1,608,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8381/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,609,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8382/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,609,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8383/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,609,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8384/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,609,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8385/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,609,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8386/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,610,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8387/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,610,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8388/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,610,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8389/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,610,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8390/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,610,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8391/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,611,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8392/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,611,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8393/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,611,456,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8394/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,611,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8395/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=1,611,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8396/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,612,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8397/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,612,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8398/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,612,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8399/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,612,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8400/500000] + optim/total_grad_norm=8.143 + train/ActionL1Loss=0.0277 + throughput/total_tokens=1,612,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8401/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,612,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8402/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,613,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8403/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,613,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8404/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,613,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8405/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,613,760,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8406/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,613,952,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8407/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,614,144,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8408/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,614,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=8409/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,614,528,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8410/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,614,720,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8411/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,614,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8412/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=1,615,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8413/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,615,296,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8414/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,615,488,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8415/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,615,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8416/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,615,872,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8417/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,616,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8418/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,616,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8419/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,616,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8420/500000] + optim/total_grad_norm=9.782 + train/ActionL1Loss=0.0315 + throughput/total_tokens=1,616,640,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=8421/500000] + train/ActionL1Loss=0.0284 + throughput/total_tokens=1,616,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8422/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,617,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8423/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=1,617,216,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8424/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,617,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8425/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=1,617,600,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8426/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,617,792,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8427/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,617,984,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8428/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,618,176,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8429/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,618,368,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8430/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,618,560,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8431/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,618,752,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8432/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,618,944,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8433/500000] + train/ActionL1Loss=0.0278 + throughput/total_tokens=1,619,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8434/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,619,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8435/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=1,619,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8436/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,619,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8437/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,619,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8438/500000] + train/ActionL1Loss=0.0319 + throughput/total_tokens=1,620,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8439/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,620,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8440/500000] + optim/total_grad_norm=9.010 + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,620,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8441/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,620,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8442/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,620,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8443/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,621,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8444/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,621,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8445/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,621,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8446/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,621,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8447/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=1,621,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8448/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,622,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8449/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,622,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8450/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,622,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8451/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,622,592,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8452/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,622,784,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8453/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,622,976,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8454/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,623,168,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8455/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=1,623,360,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8456/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,623,552,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8457/500000] + train/ActionL1Loss=0.0192 + throughput/total_tokens=1,623,744,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8458/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,623,936,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8459/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,624,128,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8460/500000] + optim/total_grad_norm=8.589 + train/ActionL1Loss=0.0643 + throughput/total_tokens=1,624,320,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=8461/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,624,512,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8462/500000] + train/ActionL1Loss=0.0263 + throughput/total_tokens=1,624,704,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8463/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,624,896,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8464/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,625,088,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8465/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,625,280,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8466/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,625,472,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8467/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=1,625,664,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8468/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,625,856,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8469/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,626,048,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8470/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,626,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8471/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,626,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8472/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,626,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8473/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,626,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8474/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,627,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8475/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,627,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8476/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,627,392,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8477/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=1,627,584,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8478/500000] + train/ActionL1Loss=0.0262 + throughput/total_tokens=1,627,776,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8479/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=1,627,968,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8480/500000] + optim/total_grad_norm=9.882 + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,628,160,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8481/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,628,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8482/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,628,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8483/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,628,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8484/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,628,928,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8485/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,629,120,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8486/500000] + train/ActionL1Loss=0.0757 + throughput/total_tokens=1,629,312,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8487/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=1,629,504,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8488/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,629,696,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8489/500000] + train/ActionL1Loss=0.0303 + throughput/total_tokens=1,629,888,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8490/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,630,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8491/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,630,272,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8492/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,630,464,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8493/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,630,656,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8494/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,630,848,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8495/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,631,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8496/500000] + train/ActionL1Loss=0.0329 + throughput/total_tokens=1,631,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8497/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,631,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8498/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=1,631,616,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8499/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,631,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8500/500000] + optim/total_grad_norm=8.904 + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,632,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +10/13 [18:06:02] INFO | >> Saving config... checkpoint.py:608 +10/13 [18:06:34] INFO | >> Saving model state... checkpoint.py:796 +10/13 [18:07:46] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [18:09:17] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=8501/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,632,192,000 + throughput/device/tokens_per_second=1,213 + throughput/device/batches_per_second=0.0505 +[step=8502/500000] + train/ActionL1Loss=0.0313 + throughput/total_tokens=1,632,384,000 + throughput/device/tokens_per_second=1,188 + throughput/device/batches_per_second=0.0495 +[step=8503/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,632,576,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=8504/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=1,632,768,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0495 +[step=8505/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,632,960,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0494 +[step=8506/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,633,152,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=8507/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,633,344,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=8508/500000] + train/ActionL1Loss=0.0351 + throughput/total_tokens=1,633,536,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8509/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,633,728,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8510/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,633,920,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=8511/500000] + train/ActionL1Loss=0.0292 + throughput/total_tokens=1,634,112,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8512/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,634,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8513/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,634,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8514/500000] + train/ActionL1Loss=0.0312 + throughput/total_tokens=1,634,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8515/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=1,634,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8516/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,635,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8517/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,635,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8518/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,635,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8519/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,635,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8520/500000] + optim/total_grad_norm=8.759 + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,635,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8521/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,636,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8522/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,636,224,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8523/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,636,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8524/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,636,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8525/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,636,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8526/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,636,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8527/500000] + train/ActionL1Loss=0.0647 + throughput/total_tokens=1,637,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8528/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,637,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8529/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,637,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8530/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,637,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8531/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,637,952,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8532/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,638,144,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8533/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=1,638,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8534/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,638,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8535/500000] + train/ActionL1Loss=0.0271 + throughput/total_tokens=1,638,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8536/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,638,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8537/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,639,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8538/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,639,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8539/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,639,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8540/500000] + optim/total_grad_norm=9.250 + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,639,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8541/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=1,639,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8542/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,640,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8543/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,640,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8544/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,640,448,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8545/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,640,640,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8546/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,640,832,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8547/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,641,024,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8548/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,641,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8549/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,641,408,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8550/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,641,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8551/500000] + train/ActionL1Loss=0.0229 + throughput/total_tokens=1,641,792,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8552/500000] + train/ActionL1Loss=0.0310 + throughput/total_tokens=1,641,984,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8553/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,642,176,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8554/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,642,368,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8555/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,642,560,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8556/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,642,752,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=8557/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,642,944,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=8558/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,643,136,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=8559/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,643,328,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 +[step=8560/500000] + optim/total_grad_norm=8.405 + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,643,520,000 + throughput/device/tokens_per_second=1,170 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=8561/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,643,712,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=8562/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,643,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8563/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,644,096,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8564/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,644,288,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8565/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=1,644,480,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8566/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,644,672,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8567/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,644,864,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8568/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,645,056,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8569/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,645,248,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8570/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,645,440,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8571/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,645,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8572/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,645,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8573/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,646,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8574/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,646,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8575/500000] + train/ActionL1Loss=0.0279 + throughput/total_tokens=1,646,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8576/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,646,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8577/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,646,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8578/500000] + train/ActionL1Loss=0.0283 + throughput/total_tokens=1,646,976,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8579/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,647,168,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8580/500000] + optim/total_grad_norm=8.140 + train/ActionL1Loss=0.0326 + throughput/total_tokens=1,647,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8581/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,647,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8582/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,647,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8583/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,647,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8584/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,648,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8585/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,648,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8586/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,648,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8587/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,648,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8588/500000] + train/ActionL1Loss=0.0611 + throughput/total_tokens=1,648,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8589/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,649,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8590/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,649,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8591/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,649,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8592/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,649,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8593/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,649,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8594/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,650,048,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8595/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=1,650,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8596/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,650,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8597/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,650,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8598/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,650,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8599/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,651,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8600/500000] + optim/total_grad_norm=8.169 + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,651,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8601/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,651,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8602/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,651,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8603/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,651,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8604/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,651,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8605/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,652,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8606/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,652,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8607/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,652,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8608/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,652,736,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8609/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,652,928,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8610/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,653,120,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=8611/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,653,312,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8612/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,653,504,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8613/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,653,696,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8614/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,653,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8615/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,654,080,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8616/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,654,272,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8617/500000] + train/ActionL1Loss=0.0322 + throughput/total_tokens=1,654,464,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8618/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,654,656,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8619/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,654,848,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8620/500000] + optim/total_grad_norm=10.17 + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,655,040,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8621/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,655,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8622/500000] + train/ActionL1Loss=0.0660 + throughput/total_tokens=1,655,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8623/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,655,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8624/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,655,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8625/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,656,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8626/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,656,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8627/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,656,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8628/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,656,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8629/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,656,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8630/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,656,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8631/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,657,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8632/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=1,657,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8633/500000] + train/ActionL1Loss=0.0323 + throughput/total_tokens=1,657,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8634/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,657,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8635/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,657,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8636/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,658,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8637/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,658,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8638/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,658,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8639/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,658,688,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8640/500000] + optim/total_grad_norm=7.642 + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,658,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8641/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=1,659,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8642/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,659,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8643/500000] + train/ActionL1Loss=0.0253 + throughput/total_tokens=1,659,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8644/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,659,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8645/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,659,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8646/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,660,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8647/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,660,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8648/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,660,416,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8649/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,660,608,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8650/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,660,800,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8651/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,660,992,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8652/500000] + train/ActionL1Loss=0.0206 + throughput/total_tokens=1,661,184,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8653/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,661,376,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8654/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,661,568,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8655/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,661,760,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8656/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,661,952,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8657/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,662,144,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8658/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,662,336,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8659/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,662,528,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=8660/500000] + optim/total_grad_norm=9.421 + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,662,720,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=8661/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,662,912,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8662/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,663,104,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8663/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,663,296,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8664/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,663,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8665/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,663,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=8666/500000] + train/ActionL1Loss=0.0193 + throughput/total_tokens=1,663,872,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8667/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,664,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8668/500000] + train/ActionL1Loss=0.0268 + throughput/total_tokens=1,664,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8669/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,664,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8670/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,664,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8671/500000] + train/ActionL1Loss=0.0310 + throughput/total_tokens=1,664,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8672/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,665,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8673/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,665,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8674/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,665,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8675/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,665,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8676/500000] + train/ActionL1Loss=0.0589 + throughput/total_tokens=1,665,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8677/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,665,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8678/500000] + train/ActionL1Loss=0.0312 + throughput/total_tokens=1,666,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8679/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,666,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8680/500000] + optim/total_grad_norm=5.993 + train/ActionL1Loss=0.0601 + throughput/total_tokens=1,666,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8681/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=1,666,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8682/500000] + train/ActionL1Loss=0.0235 + throughput/total_tokens=1,666,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8683/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,667,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8684/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=1,667,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8685/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,667,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8686/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,667,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8687/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=1,667,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8688/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,668,096,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8689/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=1,668,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8690/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=1,668,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8691/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,668,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8692/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,668,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8693/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,669,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8694/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,669,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8695/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,669,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8696/500000] + train/ActionL1Loss=0.0295 + throughput/total_tokens=1,669,632,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8697/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,669,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8698/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=1,670,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8699/500000] + train/ActionL1Loss=0.0672 + throughput/total_tokens=1,670,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8700/500000] + optim/total_grad_norm=7.666 + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,670,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8701/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,670,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8702/500000] + train/ActionL1Loss=0.0296 + throughput/total_tokens=1,670,784,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8703/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,670,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8704/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,671,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8705/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=1,671,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8706/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=1,671,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8707/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,671,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8708/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=1,671,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=8709/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,672,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=8710/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,672,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8711/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=1,672,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8712/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,672,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8713/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,672,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8714/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,673,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8715/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,673,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8716/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,673,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8717/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,673,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8718/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,673,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8719/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,674,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8720/500000] + optim/total_grad_norm=8.189 + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,674,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8721/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=1,674,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8722/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,674,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8723/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,674,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8724/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=1,675,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8725/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=1,675,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8726/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,675,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8727/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=1,675,584,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8728/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,675,776,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8729/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,675,968,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8730/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,676,160,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8731/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,676,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8732/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,676,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8733/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,676,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8734/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,676,928,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8735/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,677,120,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8736/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,677,312,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8737/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,677,504,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8738/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,677,696,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8739/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,677,888,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8740/500000] + optim/total_grad_norm=7.810 + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,678,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8741/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,678,272,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8742/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,678,464,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8743/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,678,656,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8744/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=1,678,848,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8745/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,679,040,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8746/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,679,232,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8747/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,679,424,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8748/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,679,616,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8749/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,679,808,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8750/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,680,000,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8751/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,680,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8752/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,680,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8753/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=1,680,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8754/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,680,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8755/500000] + train/ActionL1Loss=0.0310 + throughput/total_tokens=1,680,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8756/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,681,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8757/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,681,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8758/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,681,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8759/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,681,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8760/500000] + optim/total_grad_norm=8.504 + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,681,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8761/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,682,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8762/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,682,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8763/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,682,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8764/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,682,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8765/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,682,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8766/500000] + train/ActionL1Loss=0.0642 + throughput/total_tokens=1,683,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8767/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,683,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8768/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,683,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8769/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,683,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8770/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,683,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8771/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,684,032,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8772/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=1,684,224,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8773/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,684,416,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8774/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,684,608,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8775/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,684,800,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8776/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,684,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8777/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,685,184,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8778/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,685,376,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8779/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,685,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8780/500000] + optim/total_grad_norm=7.451 + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,685,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8781/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,685,952,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8782/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=1,686,144,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8783/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,686,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8784/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,686,528,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8785/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,686,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8786/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,686,912,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8787/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,687,104,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8788/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,687,296,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8789/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,687,488,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8790/500000] + train/ActionL1Loss=0.0213 + throughput/total_tokens=1,687,680,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8791/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,687,872,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8792/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,688,064,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8793/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,688,256,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8794/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,688,448,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8795/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,688,640,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8796/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,688,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8797/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,689,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8798/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,689,216,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8799/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,689,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8800/500000] + optim/total_grad_norm=7.654 + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,689,600,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8801/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,689,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8802/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,689,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8803/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,690,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8804/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=1,690,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8805/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,690,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8806/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,690,752,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8807/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,690,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8808/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,691,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8809/500000] + train/ActionL1Loss=0.0329 + throughput/total_tokens=1,691,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8810/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,691,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8811/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,691,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8812/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,691,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8813/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,692,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8814/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,692,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8815/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=1,692,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8816/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,692,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8817/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,692,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8818/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,693,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8819/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,693,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8820/500000] + optim/total_grad_norm=6.717 + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,693,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8821/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,693,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8822/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,693,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8823/500000] + train/ActionL1Loss=0.0312 + throughput/total_tokens=1,694,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8824/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,694,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8825/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,694,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8826/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,694,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8827/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,694,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8828/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,694,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8829/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,695,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8830/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,695,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8831/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,695,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8832/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,695,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8833/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,695,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8834/500000] + train/ActionL1Loss=0.0682 + throughput/total_tokens=1,696,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8835/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,696,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8836/500000] + train/ActionL1Loss=0.0277 + throughput/total_tokens=1,696,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8837/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,696,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8838/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=1,696,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8839/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,697,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8840/500000] + optim/total_grad_norm=7.604 + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,697,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8841/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,697,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8842/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,697,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8843/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,697,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8844/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,698,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8845/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,698,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8846/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,698,432,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8847/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,698,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8848/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,698,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8849/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,699,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8850/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,699,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8851/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,699,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8852/500000] + train/ActionL1Loss=0.0318 + throughput/total_tokens=1,699,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8853/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,699,776,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=8854/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,699,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8855/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,700,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8856/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,700,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8857/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,700,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8858/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,700,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8859/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,700,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8860/500000] + optim/total_grad_norm=7.945 + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,701,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8861/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,701,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8862/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,701,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8863/500000] + train/ActionL1Loss=0.0714 + throughput/total_tokens=1,701,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8864/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,701,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8865/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,702,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8866/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=1,702,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8867/500000] + train/ActionL1Loss=0.0600 + throughput/total_tokens=1,702,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8868/500000] + train/ActionL1Loss=0.0618 + throughput/total_tokens=1,702,656,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8869/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,702,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8870/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,703,040,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=8871/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=1,703,232,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8872/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,703,424,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8873/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,703,616,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8874/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=1,703,808,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8875/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,704,000,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8876/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,704,192,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8877/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,704,384,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8878/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,704,576,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=8879/500000] + train/ActionL1Loss=0.0292 + throughput/total_tokens=1,704,768,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8880/500000] + optim/total_grad_norm=8.241 + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,704,960,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8881/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,705,152,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8882/500000] + train/ActionL1Loss=0.0254 + throughput/total_tokens=1,705,344,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8883/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,705,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8884/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,705,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8885/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,705,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8886/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,706,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8887/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,706,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8888/500000] + train/ActionL1Loss=0.0301 + throughput/total_tokens=1,706,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8889/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,706,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8890/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,706,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8891/500000] + train/ActionL1Loss=0.0228 + throughput/total_tokens=1,707,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8892/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,707,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8893/500000] + train/ActionL1Loss=0.0636 + throughput/total_tokens=1,707,456,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8894/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,707,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8895/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=1,707,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8896/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,708,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8897/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,708,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8898/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,708,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8899/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,708,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8900/500000] + optim/total_grad_norm=7.453 + train/ActionL1Loss=0.0332 + throughput/total_tokens=1,708,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8901/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,708,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8902/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,709,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8903/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,709,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8904/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,709,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8905/500000] + train/ActionL1Loss=0.0319 + throughput/total_tokens=1,709,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8906/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,709,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8907/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,710,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8908/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,710,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8909/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,710,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8910/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,710,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=8911/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,710,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8912/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=1,711,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8913/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,711,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8914/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,711,488,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8915/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,711,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8916/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=1,711,872,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8917/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,712,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8918/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,712,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8919/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,712,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=8920/500000] + optim/total_grad_norm=9.586 + train/ActionL1Loss=0.0606 + throughput/total_tokens=1,712,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8921/500000] + train/ActionL1Loss=0.0689 + throughput/total_tokens=1,712,832,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8922/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,713,024,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8923/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,713,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8924/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,713,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8925/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,713,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8926/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,713,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8927/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,713,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8928/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,714,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8929/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,714,368,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8930/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,714,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8931/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,714,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8932/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,714,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8933/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,715,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8934/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,715,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8935/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,715,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8936/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,715,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8937/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,715,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8938/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=1,716,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8939/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=1,716,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8940/500000] + optim/total_grad_norm=8.206 + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,716,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8941/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,716,672,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8942/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,716,864,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8943/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,717,056,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8944/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,717,248,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8945/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,717,440,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8946/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,717,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8947/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=1,717,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8948/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,718,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8949/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,718,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=8950/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=1,718,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8951/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,718,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8952/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,718,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8953/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,718,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8954/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,719,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8955/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,719,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8956/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=1,719,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8957/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,719,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8958/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,719,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8959/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,720,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8960/500000] + optim/total_grad_norm=7.144 + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,720,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=8961/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,720,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8962/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=1,720,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=8963/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,720,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8964/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,721,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8965/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,721,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=8966/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,721,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8967/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,721,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8968/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,721,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=8969/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,722,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=8970/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,722,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8971/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,722,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8972/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,722,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8973/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,722,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8974/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,723,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=8975/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,723,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8976/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,723,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8977/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,723,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8978/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,723,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8979/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,723,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=8980/500000] + optim/total_grad_norm=9.507 + train/ActionL1Loss=0.0742 + throughput/total_tokens=1,724,160,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8981/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,724,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8982/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,724,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8983/500000] + train/ActionL1Loss=0.0327 + throughput/total_tokens=1,724,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8984/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,724,928,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8985/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,725,120,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8986/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,725,312,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8987/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,725,504,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8988/500000] + train/ActionL1Loss=0.0307 + throughput/total_tokens=1,725,696,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8989/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,725,888,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8990/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,726,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=8991/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,726,272,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8992/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,726,464,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8993/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,726,656,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8994/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,726,848,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8995/500000] + train/ActionL1Loss=0.0313 + throughput/total_tokens=1,727,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8996/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,727,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8997/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,727,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8998/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,727,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=8999/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,727,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9000/500000] + optim/total_grad_norm=9.192 + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,728,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/13 [21:00:20] INFO | >> Saving config... checkpoint.py:608 +10/13 [21:01:20] INFO | >> Saving model state... checkpoint.py:796 +10/13 [21:02:27] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [21:04:00] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=9001/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,728,192,000 + throughput/device/tokens_per_second=1,212 + throughput/device/batches_per_second=0.0505 +[step=9002/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=1,728,384,000 + throughput/device/tokens_per_second=1,195 + throughput/device/batches_per_second=0.0498 +[step=9003/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,728,576,000 + throughput/device/tokens_per_second=1,189 + throughput/device/batches_per_second=0.0496 +[step=9004/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,728,768,000 + throughput/device/tokens_per_second=1,187 + throughput/device/batches_per_second=0.0495 +[step=9005/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=1,728,960,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=9006/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,729,152,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0494 +[step=9007/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,729,344,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=9008/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,729,536,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0494 +[step=9009/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,729,728,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0494 +[step=9010/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,729,920,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 + System/Peak GPU Memory (MB)=46,924 +[step=9011/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,730,112,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0493 +[step=9012/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,730,304,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0493 +[step=9013/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,730,496,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=9014/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,730,688,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=9015/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,730,880,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=9016/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,731,072,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=9017/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,731,264,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=9018/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,731,456,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=9019/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,731,648,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9020/500000] + optim/total_grad_norm=7.725 + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,731,840,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9021/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,732,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9022/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=1,732,224,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9023/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,732,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9024/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,732,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9025/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,732,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9026/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,732,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9027/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,733,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9028/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=1,733,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9029/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,733,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9030/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,733,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9031/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,733,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9032/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=1,734,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9033/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,734,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9034/500000] + train/ActionL1Loss=0.0253 + throughput/total_tokens=1,734,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9035/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,734,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9036/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,734,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9037/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,735,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9038/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,735,296,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9039/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,735,488,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9040/500000] + optim/total_grad_norm=8.734 + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,735,680,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9041/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,735,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9042/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,736,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9043/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,736,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9044/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,736,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9045/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=1,736,640,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9046/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,736,832,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9047/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,737,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9048/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,737,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9049/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,737,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9050/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,737,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9051/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=1,737,792,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9052/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,737,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9053/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,738,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9054/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,738,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9055/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,738,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9056/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,738,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9057/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=1,738,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9058/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,739,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9059/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,739,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9060/500000] + optim/total_grad_norm=9.631 + train/ActionL1Loss=0.0303 + throughput/total_tokens=1,739,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9061/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,739,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9062/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,739,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9063/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,740,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9064/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,740,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9065/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,740,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9066/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,740,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9067/500000] + train/ActionL1Loss=0.0312 + throughput/total_tokens=1,740,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9068/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,741,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9069/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=1,741,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9070/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,741,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9071/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,741,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9072/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,741,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9073/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,742,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9074/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,742,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9075/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,742,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9076/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=1,742,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9077/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,742,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9078/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,742,976,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9079/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,743,168,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9080/500000] + optim/total_grad_norm=7.810 + train/ActionL1Loss=0.0286 + throughput/total_tokens=1,743,360,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9081/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,743,552,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9082/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,743,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9083/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,743,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9084/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,744,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9085/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,744,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9086/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,744,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9087/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,744,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9088/500000] + train/ActionL1Loss=0.0249 + throughput/total_tokens=1,744,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9089/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,745,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9090/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,745,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9091/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,745,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9092/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,745,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9093/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,745,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9094/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,746,048,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9095/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,746,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9096/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,746,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9097/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,746,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9098/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,746,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9099/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=1,747,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9100/500000] + optim/total_grad_norm=6.483 + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,747,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9101/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,747,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9102/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,747,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9103/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,747,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9104/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,747,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9105/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,748,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9106/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,748,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9107/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,748,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9108/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,748,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9109/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,748,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9110/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,749,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9111/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,749,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9112/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=1,749,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9113/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=1,749,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9114/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,749,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9115/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,750,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9116/500000] + train/ActionL1Loss=0.0655 + throughput/total_tokens=1,750,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9117/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,750,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9118/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,750,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9119/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=1,750,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9120/500000] + optim/total_grad_norm=8.320 + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,751,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9121/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,751,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9122/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,751,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9123/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,751,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9124/500000] + train/ActionL1Loss=0.0286 + throughput/total_tokens=1,751,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9125/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,752,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9126/500000] + train/ActionL1Loss=0.0634 + throughput/total_tokens=1,752,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9127/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,752,384,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9128/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=1,752,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9129/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,752,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9130/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,752,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9131/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,753,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9132/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,753,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9133/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,753,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9134/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,753,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9135/500000] + train/ActionL1Loss=0.0297 + throughput/total_tokens=1,753,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9136/500000] + train/ActionL1Loss=0.0282 + throughput/total_tokens=1,754,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9137/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,754,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9138/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,754,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9139/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,754,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9140/500000] + optim/total_grad_norm=7.629 + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,754,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9141/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,755,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9142/500000] + train/ActionL1Loss=0.0602 + throughput/total_tokens=1,755,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9143/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,755,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9144/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,755,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9145/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,755,840,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9146/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,756,032,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9147/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,756,224,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9148/500000] + train/ActionL1Loss=0.0256 + throughput/total_tokens=1,756,416,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9149/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,756,608,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9150/500000] + train/ActionL1Loss=0.0259 + throughput/total_tokens=1,756,800,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9151/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,756,992,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9152/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,757,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9153/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,757,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9154/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,757,568,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9155/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=1,757,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9156/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,757,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9157/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=1,758,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9158/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,758,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9159/500000] + train/ActionL1Loss=0.0265 + throughput/total_tokens=1,758,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9160/500000] + optim/total_grad_norm=7.519 + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,758,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9161/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,758,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9162/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,759,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9163/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,759,296,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9164/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=1,759,488,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9165/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,759,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9166/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,759,872,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9167/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,760,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9168/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,760,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9169/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=1,760,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9170/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,760,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9171/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,760,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9172/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,761,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9173/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,761,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9174/500000] + train/ActionL1Loss=0.0230 + throughput/total_tokens=1,761,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9175/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,761,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9176/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,761,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9177/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,761,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9178/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=1,762,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9179/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,762,368,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9180/500000] + optim/total_grad_norm=7.239 + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,762,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9181/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,762,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9182/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,762,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9183/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,763,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9184/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=1,763,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9185/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,763,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9186/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=1,763,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9187/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=1,763,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9188/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,764,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9189/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,764,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9190/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,764,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9191/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,764,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9192/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,764,864,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9193/500000] + train/ActionL1Loss=0.0277 + throughput/total_tokens=1,765,056,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9194/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,765,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9195/500000] + train/ActionL1Loss=0.0322 + throughput/total_tokens=1,765,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9196/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,765,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9197/500000] + train/ActionL1Loss=0.0255 + throughput/total_tokens=1,765,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9198/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,766,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9199/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,766,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9200/500000] + optim/total_grad_norm=8.998 + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,766,400,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9201/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,766,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9202/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,766,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9203/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,766,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9204/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,767,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9205/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,767,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9206/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,767,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9207/500000] + train/ActionL1Loss=0.0621 + throughput/total_tokens=1,767,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9208/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,767,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9209/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,768,128,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9210/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=1,768,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9211/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,768,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9212/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,768,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9213/500000] + train/ActionL1Loss=0.0283 + throughput/total_tokens=1,768,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9214/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,769,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9215/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,769,280,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9216/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,769,472,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9217/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,769,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9218/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,769,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9219/500000] + train/ActionL1Loss=0.0654 + throughput/total_tokens=1,770,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9220/500000] + optim/total_grad_norm=9.014 + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,770,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9221/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,770,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9222/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,770,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9223/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,770,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9224/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,771,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9225/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,771,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9226/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,771,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9227/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,771,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9228/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,771,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9229/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,771,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9230/500000] + train/ActionL1Loss=0.0234 + throughput/total_tokens=1,772,160,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9231/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,772,352,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9232/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,772,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9233/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,772,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9234/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=1,772,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9235/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,773,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9236/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,773,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9237/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,773,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9238/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,773,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9239/500000] + train/ActionL1Loss=0.0276 + throughput/total_tokens=1,773,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9240/500000] + optim/total_grad_norm=7.694 + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,774,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9241/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=1,774,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9242/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,774,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9243/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,774,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9244/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,774,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9245/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,775,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9246/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,775,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9247/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,775,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9248/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,775,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9249/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,775,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9250/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,776,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9251/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,776,192,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9252/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,776,384,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9253/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,776,576,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9254/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,776,768,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9255/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,776,960,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9256/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,777,152,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9257/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,777,344,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9258/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=1,777,536,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9259/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=1,777,728,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9260/500000] + optim/total_grad_norm=8.965 + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,777,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9261/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,778,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9262/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,778,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9263/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,778,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9264/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,778,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9265/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,778,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9266/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,779,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9267/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,779,264,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9268/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,779,456,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9269/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,779,648,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9270/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,779,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9271/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=1,780,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9272/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,780,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9273/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,780,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9274/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,780,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9275/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,780,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9276/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,780,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9277/500000] + train/ActionL1Loss=0.0256 + throughput/total_tokens=1,781,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9278/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,781,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9279/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,781,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9280/500000] + optim/total_grad_norm=6.095 + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,781,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9281/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,781,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9282/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,782,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9283/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,782,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9284/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,782,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9285/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,782,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9286/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,782,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9287/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,783,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9288/500000] + train/ActionL1Loss=0.0275 + throughput/total_tokens=1,783,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9289/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=1,783,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9290/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=1,783,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9291/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,783,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9292/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=1,784,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9293/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,784,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9294/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,784,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9295/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,784,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9296/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,784,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9297/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,785,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9298/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,785,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9299/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,785,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9300/500000] + optim/total_grad_norm=8.585 + train/ActionL1Loss=0.0369 + throughput/total_tokens=1,785,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9301/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,785,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9302/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,785,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9303/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,786,176,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9304/500000] + train/ActionL1Loss=0.0273 + throughput/total_tokens=1,786,368,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9305/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,786,560,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9306/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,786,752,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9307/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,786,944,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9308/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,787,136,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9309/500000] + train/ActionL1Loss=0.0307 + throughput/total_tokens=1,787,328,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9310/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,787,520,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=9311/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,787,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9312/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=1,787,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9313/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,788,096,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9314/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,788,288,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9315/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,788,480,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9316/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,788,672,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9317/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=1,788,864,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9318/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,789,056,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9319/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=1,789,248,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9320/500000] + optim/total_grad_norm=9.376 + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,789,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9321/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,789,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9322/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,789,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9323/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,790,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9324/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,790,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9325/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,790,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9326/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,790,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9327/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,790,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9328/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,790,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9329/500000] + train/ActionL1Loss=0.0295 + throughput/total_tokens=1,791,168,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9330/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,791,360,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9331/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,791,552,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9332/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,791,744,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9333/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,791,936,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9334/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=1,792,128,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9335/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,792,320,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9336/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,792,512,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9337/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,792,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9338/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,792,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9339/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,793,088,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9340/500000] + optim/total_grad_norm=6.651 + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,793,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9341/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,793,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9342/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,793,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9343/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,793,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9344/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,794,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9345/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,794,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9346/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,794,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9347/500000] + train/ActionL1Loss=0.0270 + throughput/total_tokens=1,794,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9348/500000] + train/ActionL1Loss=0.0269 + throughput/total_tokens=1,794,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9349/500000] + train/ActionL1Loss=0.0227 + throughput/total_tokens=1,795,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9350/500000] + train/ActionL1Loss=0.0641 + throughput/total_tokens=1,795,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9351/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,795,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9352/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,795,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9353/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,795,776,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9354/500000] + train/ActionL1Loss=0.0640 + throughput/total_tokens=1,795,968,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9355/500000] + train/ActionL1Loss=0.0270 + throughput/total_tokens=1,796,160,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9356/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,796,352,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9357/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=1,796,544,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9358/500000] + train/ActionL1Loss=0.0302 + throughput/total_tokens=1,796,736,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9359/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,796,928,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9360/500000] + optim/total_grad_norm=8.421 + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,797,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9361/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,797,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9362/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,797,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9363/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,797,696,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9364/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,797,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9365/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,798,080,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9366/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,798,272,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9367/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,798,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9368/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,798,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9369/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,798,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9370/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=1,799,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9371/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,799,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9372/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,799,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9373/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=1,799,616,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9374/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,799,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9375/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,800,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9376/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,800,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9377/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,800,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9378/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,800,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9379/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,800,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9380/500000] + optim/total_grad_norm=7.974 + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,800,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9381/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,801,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9382/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,801,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9383/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,801,536,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9384/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=1,801,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9385/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,801,920,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9386/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=1,802,112,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9387/500000] + train/ActionL1Loss=0.0313 + throughput/total_tokens=1,802,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9388/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=1,802,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9389/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,802,688,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9390/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,802,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9391/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,803,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9392/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,803,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9393/500000] + train/ActionL1Loss=0.0698 + throughput/total_tokens=1,803,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9394/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,803,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9395/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,803,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9396/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,804,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9397/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,804,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9398/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,804,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9399/500000] + train/ActionL1Loss=0.0329 + throughput/total_tokens=1,804,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9400/500000] + optim/total_grad_norm=7.392 + train/ActionL1Loss=0.0314 + throughput/total_tokens=1,804,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9401/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,804,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9402/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,805,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9403/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,805,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9404/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,805,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9405/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,805,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9406/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,805,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9407/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=1,806,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9408/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,806,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9409/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,806,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9410/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,806,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9411/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,806,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9412/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,807,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9413/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,807,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9414/500000] + train/ActionL1Loss=0.0280 + throughput/total_tokens=1,807,488,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9415/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,807,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9416/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,807,872,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9417/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,808,064,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9418/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,808,256,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9419/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=1,808,448,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9420/500000] + optim/total_grad_norm=9.566 + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,808,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9421/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,808,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9422/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,809,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9423/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,809,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9424/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,809,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9425/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,809,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9426/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,809,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9427/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,809,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9428/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,810,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9429/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,810,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9430/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=1,810,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9431/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,810,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9432/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,810,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9433/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,811,136,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9434/500000] + train/ActionL1Loss=0.0627 + throughput/total_tokens=1,811,328,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9435/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,811,520,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9436/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,811,712,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9437/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,811,904,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9438/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,812,096,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9439/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,812,288,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9440/500000] + optim/total_grad_norm=9.392 + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,812,480,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9441/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,812,672,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9442/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,812,864,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9443/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,813,056,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9444/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,813,248,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9445/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=1,813,440,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9446/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,813,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9447/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=1,813,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9448/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,814,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9449/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,814,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9450/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,814,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9451/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,814,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9452/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,814,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9453/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,814,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9454/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,815,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9455/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,815,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9456/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=1,815,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9457/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,815,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9458/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,815,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9459/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,816,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9460/500000] + optim/total_grad_norm=8.086 + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,816,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9461/500000] + train/ActionL1Loss=0.0652 + throughput/total_tokens=1,816,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9462/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=1,816,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9463/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,816,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9464/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,817,088,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9465/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,817,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9466/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,817,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9467/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,817,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9468/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,817,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9469/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,818,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9470/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,818,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9471/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=1,818,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9472/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,818,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9473/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=1,818,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9474/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,819,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9475/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,819,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9476/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=1,819,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9477/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,819,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9478/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,819,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9479/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,819,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9480/500000] + optim/total_grad_norm=9.256 + train/ActionL1Loss=0.0629 + throughput/total_tokens=1,820,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9481/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,820,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9482/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,820,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9483/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,820,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9484/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,820,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9485/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=1,821,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9486/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,821,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9487/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,821,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9488/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,821,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9489/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,821,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9490/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,822,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9491/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,822,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9492/500000] + train/ActionL1Loss=0.0610 + throughput/total_tokens=1,822,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9493/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,822,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9494/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,822,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9495/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,823,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9496/500000] + train/ActionL1Loss=0.0635 + throughput/total_tokens=1,823,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9497/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,823,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9498/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,823,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9499/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,823,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9500/500000] + optim/total_grad_norm=8.263 + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,824,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +10/13 [23:55:07] INFO | >> Saving config... checkpoint.py:608 +10/13 [23:55:49] INFO | >> Saving model state... checkpoint.py:796 +10/13 [23:57:01] INFO | >> Saving optim state... checkpoint.py:811 +10/13 [23:58:34] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=9501/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,824,192,000 + throughput/device/tokens_per_second=1,210 + throughput/device/batches_per_second=0.0504 +[step=9502/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,824,384,000 + throughput/device/tokens_per_second=1,188 + throughput/device/batches_per_second=0.0495 +[step=9503/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=1,824,576,000 + throughput/device/tokens_per_second=1,187 + throughput/device/batches_per_second=0.0495 +[step=9504/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,824,768,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0494 +[step=9505/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,824,960,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=9506/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,825,152,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=9507/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,825,344,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=9508/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,825,536,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=9509/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,825,728,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9510/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,825,920,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=9511/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=1,826,112,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9512/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,826,304,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9513/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,826,496,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9514/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=1,826,688,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9515/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=1,826,880,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9516/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,827,072,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9517/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,827,264,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9518/500000] + train/ActionL1Loss=0.0345 + throughput/total_tokens=1,827,456,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9519/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,827,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9520/500000] + optim/total_grad_norm=6.836 + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,827,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9521/500000] + train/ActionL1Loss=0.0283 + throughput/total_tokens=1,828,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9522/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,828,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9523/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,828,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9524/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,828,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9525/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=1,828,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9526/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,828,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9527/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=1,829,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9528/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,829,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9529/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,829,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9530/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,829,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9531/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,829,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9532/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,830,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9533/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=1,830,336,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9534/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,830,528,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9535/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,830,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9536/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=1,830,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9537/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=1,831,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9538/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,831,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9539/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,831,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9540/500000] + optim/total_grad_norm=8.695 + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,831,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9541/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=1,831,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9542/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,832,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9543/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=1,832,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9544/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,832,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9545/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,832,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9546/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,832,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9547/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,833,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9548/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=1,833,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9549/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=1,833,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9550/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,833,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9551/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=1,833,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9552/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,833,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9553/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=1,834,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9554/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,834,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9555/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,834,560,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9556/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,834,752,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9557/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,834,944,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9558/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,835,136,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9559/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,835,328,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9560/500000] + optim/total_grad_norm=7.630 + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,835,520,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=9561/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,835,712,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9562/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,835,904,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9563/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,836,096,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9564/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,836,288,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9565/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,836,480,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9566/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,836,672,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9567/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,836,864,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9568/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,837,056,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9569/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,837,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9570/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,837,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9571/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,837,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9572/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,837,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9573/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,838,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9574/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,838,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9575/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,838,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9576/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,838,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9577/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,838,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9578/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,838,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9579/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,839,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9580/500000] + optim/total_grad_norm=7.971 + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,839,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9581/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,839,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9582/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,839,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9583/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,839,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9584/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,840,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9585/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=1,840,320,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9586/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,840,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9587/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=1,840,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9588/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,840,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9589/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,841,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9590/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,841,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9591/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,841,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9592/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,841,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9593/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=1,841,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9594/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,842,048,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9595/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,842,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9596/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,842,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9597/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,842,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9598/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,842,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9599/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,843,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9600/500000] + optim/total_grad_norm=7.664 + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,843,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9601/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,843,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9602/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,843,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9603/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,843,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9604/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,843,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9605/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,844,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9606/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,844,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9607/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,844,544,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9608/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,844,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9609/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=1,844,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9610/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,845,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9611/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=1,845,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9612/500000] + train/ActionL1Loss=0.0308 + throughput/total_tokens=1,845,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9613/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,845,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9614/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=1,845,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9615/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,846,080,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9616/500000] + train/ActionL1Loss=0.0644 + throughput/total_tokens=1,846,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9617/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=1,846,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9618/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,846,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9619/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,846,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9620/500000] + optim/total_grad_norm=8.207 + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,847,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9621/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,847,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9622/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,847,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9623/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,847,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9624/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=1,847,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9625/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,848,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9626/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,848,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9627/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,848,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9628/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,848,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9629/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,848,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9630/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,848,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9631/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=1,849,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9632/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=1,849,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9633/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,849,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9634/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,849,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9635/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=1,849,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9636/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,850,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9637/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,850,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9638/500000] + train/ActionL1Loss=0.0293 + throughput/total_tokens=1,850,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9639/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,850,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9640/500000] + optim/total_grad_norm=7.350 + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,850,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9641/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,851,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9642/500000] + train/ActionL1Loss=0.0308 + throughput/total_tokens=1,851,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9643/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,851,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9644/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,851,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9645/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,851,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9646/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,852,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9647/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,852,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9648/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,852,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9649/500000] + train/ActionL1Loss=0.0310 + throughput/total_tokens=1,852,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9650/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,852,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9651/500000] + train/ActionL1Loss=0.0291 + throughput/total_tokens=1,852,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9652/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,853,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9653/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,853,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9654/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=1,853,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9655/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=1,853,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9656/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,853,952,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9657/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=1,854,144,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9658/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,854,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9659/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,854,528,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9660/500000] + optim/total_grad_norm=9.961 + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,854,720,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=9661/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=1,854,912,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9662/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,855,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9663/500000] + train/ActionL1Loss=0.0290 + throughput/total_tokens=1,855,296,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9664/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=1,855,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9665/500000] + train/ActionL1Loss=0.0345 + throughput/total_tokens=1,855,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9666/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,855,872,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9667/500000] + train/ActionL1Loss=0.0308 + throughput/total_tokens=1,856,064,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9668/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,856,256,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9669/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=1,856,448,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9670/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,856,640,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9671/500000] + train/ActionL1Loss=0.0323 + throughput/total_tokens=1,856,832,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9672/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,857,024,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9673/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,857,216,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9674/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,857,408,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9675/500000] + train/ActionL1Loss=0.0302 + throughput/total_tokens=1,857,600,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9676/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,857,792,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9677/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,857,984,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9678/500000] + train/ActionL1Loss=0.0637 + throughput/total_tokens=1,858,176,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9679/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,858,368,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=9680/500000] + optim/total_grad_norm=4.804 + train/ActionL1Loss=0.0304 + throughput/total_tokens=1,858,560,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=9681/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,858,752,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9682/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,858,944,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9683/500000] + train/ActionL1Loss=0.0596 + throughput/total_tokens=1,859,136,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9684/500000] + train/ActionL1Loss=0.0302 + throughput/total_tokens=1,859,328,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9685/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,859,520,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9686/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,859,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9687/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,859,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9688/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,860,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9689/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,860,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9690/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=1,860,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9691/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,860,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9692/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,860,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9693/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,861,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9694/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,861,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9695/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,861,440,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9696/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,861,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9697/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,861,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9698/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,862,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9699/500000] + train/ActionL1Loss=0.0280 + throughput/total_tokens=1,862,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9700/500000] + optim/total_grad_norm=9.611 + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,862,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9701/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=1,862,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9702/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=1,862,784,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9703/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,862,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9704/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,863,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9705/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,863,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9706/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,863,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9707/500000] + train/ActionL1Loss=0.0622 + throughput/total_tokens=1,863,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9708/500000] + train/ActionL1Loss=0.0245 + throughput/total_tokens=1,863,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9709/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,864,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9710/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,864,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9711/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,864,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9712/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,864,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9713/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,864,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9714/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,865,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9715/500000] + train/ActionL1Loss=0.0647 + throughput/total_tokens=1,865,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9716/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,865,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9717/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,865,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9718/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,865,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9719/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,866,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9720/500000] + optim/total_grad_norm=8.573 + train/ActionL1Loss=0.0329 + throughput/total_tokens=1,866,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9721/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,866,432,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9722/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,866,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9723/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,866,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9724/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,867,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9725/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=1,867,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9726/500000] + train/ActionL1Loss=0.0188 + throughput/total_tokens=1,867,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9727/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,867,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9728/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,867,776,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9729/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,867,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9730/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,868,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9731/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,868,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9732/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,868,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9733/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,868,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9734/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,868,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9735/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,869,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9736/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,869,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9737/500000] + train/ActionL1Loss=0.0571 + throughput/total_tokens=1,869,504,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9738/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,869,696,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9739/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,869,888,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9740/500000] + optim/total_grad_norm=9.111 + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,870,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9741/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,870,272,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9742/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=1,870,464,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9743/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,870,656,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=9744/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,870,848,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9745/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,871,040,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9746/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,871,232,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9747/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,871,424,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9748/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,871,616,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9749/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,871,808,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=9750/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,872,000,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=9751/500000] + train/ActionL1Loss=0.0305 + throughput/total_tokens=1,872,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9752/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,872,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9753/500000] + train/ActionL1Loss=0.0345 + throughput/total_tokens=1,872,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9754/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,872,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9755/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,872,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9756/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,873,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9757/500000] + train/ActionL1Loss=0.0293 + throughput/total_tokens=1,873,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9758/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,873,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9759/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,873,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9760/500000] + optim/total_grad_norm=9.068 + train/ActionL1Loss=0.0664 + throughput/total_tokens=1,873,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9761/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=1,874,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9762/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,874,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9763/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=1,874,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9764/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,874,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9765/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,874,880,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9766/500000] + train/ActionL1Loss=0.0293 + throughput/total_tokens=1,875,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9767/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,875,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9768/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,875,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9769/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=1,875,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9770/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=1,875,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9771/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,876,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9772/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,876,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9773/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=1,876,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9774/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,876,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9775/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,876,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9776/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,876,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9777/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=1,877,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9778/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,877,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9779/500000] + train/ActionL1Loss=0.0312 + throughput/total_tokens=1,877,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9780/500000] + optim/total_grad_norm=6.345 + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,877,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9781/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=1,877,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9782/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,878,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9783/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,878,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9784/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,878,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9785/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=1,878,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9786/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,878,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9787/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=1,879,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9788/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=1,879,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9789/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,879,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9790/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,879,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9791/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,879,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9792/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=1,880,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9793/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,880,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9794/500000] + train/ActionL1Loss=0.0278 + throughput/total_tokens=1,880,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9795/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,880,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9796/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,880,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9797/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,881,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9798/500000] + train/ActionL1Loss=0.0276 + throughput/total_tokens=1,881,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9799/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,881,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9800/500000] + optim/total_grad_norm=8.721 + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,881,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9801/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,881,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9802/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,881,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9803/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=1,882,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9804/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,882,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9805/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=1,882,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9806/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=1,882,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9807/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=1,882,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9808/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,883,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9809/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=1,883,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9810/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,883,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9811/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,883,712,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9812/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,883,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9813/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,884,096,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9814/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=1,884,288,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9815/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,884,480,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9816/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,884,672,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9817/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,884,864,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9818/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,885,056,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9819/500000] + train/ActionL1Loss=0.0220 + throughput/total_tokens=1,885,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9820/500000] + optim/total_grad_norm=9.333 + train/ActionL1Loss=0.0540 + throughput/total_tokens=1,885,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9821/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=1,885,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9822/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,885,824,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9823/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,886,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9824/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,886,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9825/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=1,886,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9826/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,886,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9827/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,886,784,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9828/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=1,886,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9829/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,887,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9830/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,887,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9831/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,887,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9832/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,887,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9833/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,887,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9834/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,888,128,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9835/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=1,888,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9836/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,888,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9837/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,888,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9838/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=1,888,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9839/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,889,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9840/500000] + optim/total_grad_norm=9.132 + train/ActionL1Loss=0.0669 + throughput/total_tokens=1,889,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9841/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=1,889,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9842/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,889,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9843/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,889,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9844/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=1,890,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9845/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=1,890,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9846/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,890,432,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9847/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,890,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9848/500000] + train/ActionL1Loss=0.0262 + throughput/total_tokens=1,890,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9849/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,891,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9850/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=1,891,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9851/500000] + train/ActionL1Loss=0.0333 + throughput/total_tokens=1,891,392,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9852/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=1,891,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9853/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,891,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9854/500000] + train/ActionL1Loss=0.0293 + throughput/total_tokens=1,891,968,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9855/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,892,160,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9856/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,892,352,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9857/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,892,544,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9858/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,892,736,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=9859/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=1,892,928,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=9860/500000] + optim/total_grad_norm=7.736 + train/ActionL1Loss=0.0341 + throughput/total_tokens=1,893,120,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 + System/Peak GPU Memory (MB)=46,924 +[step=9861/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=1,893,312,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=9862/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,893,504,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=9863/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=1,893,696,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=9864/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,893,888,000 + throughput/device/tokens_per_second=1,171 + throughput/device/batches_per_second=0.0488 +[step=9865/500000] + train/ActionL1Loss=0.0609 + throughput/total_tokens=1,894,080,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=9866/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=1,894,272,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=9867/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,894,464,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9868/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,894,656,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9869/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,894,848,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=9870/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,895,040,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9871/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=1,895,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9872/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=1,895,424,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9873/500000] + train/ActionL1Loss=0.0305 + throughput/total_tokens=1,895,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9874/500000] + train/ActionL1Loss=0.0256 + throughput/total_tokens=1,895,808,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9875/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,896,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9876/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,896,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9877/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=1,896,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9878/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,896,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9879/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,896,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9880/500000] + optim/total_grad_norm=7.384 + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,896,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9881/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,897,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9882/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,897,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9883/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,897,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9884/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,897,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9885/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=1,897,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9886/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,898,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9887/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,898,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9888/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,898,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9889/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,898,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9890/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=1,898,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9891/500000] + train/ActionL1Loss=0.0332 + throughput/total_tokens=1,899,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9892/500000] + train/ActionL1Loss=0.0705 + throughput/total_tokens=1,899,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9893/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=1,899,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9894/500000] + train/ActionL1Loss=0.0614 + throughput/total_tokens=1,899,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9895/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,899,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9896/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=1,900,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9897/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,900,224,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9898/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=1,900,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9899/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,900,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=9900/500000] + optim/total_grad_norm=8.452 + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,900,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9901/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,900,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9902/500000] + train/ActionL1Loss=0.0290 + throughput/total_tokens=1,901,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9903/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,901,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9904/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=1,901,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9905/500000] + train/ActionL1Loss=0.0251 + throughput/total_tokens=1,901,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9906/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=1,901,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9907/500000] + train/ActionL1Loss=0.0310 + throughput/total_tokens=1,902,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9908/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,902,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9909/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,902,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9910/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,902,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9911/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=1,902,912,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9912/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=1,903,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9913/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,903,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9914/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,903,488,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9915/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=1,903,680,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9916/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,903,872,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9917/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,904,064,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9918/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,904,256,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9919/500000] + train/ActionL1Loss=0.0756 + throughput/total_tokens=1,904,448,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9920/500000] + optim/total_grad_norm=8.225 + train/ActionL1Loss=0.0570 + throughput/total_tokens=1,904,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9921/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,904,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9922/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,905,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9923/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,905,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9924/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,905,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9925/500000] + train/ActionL1Loss=0.0265 + throughput/total_tokens=1,905,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9926/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=1,905,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9927/500000] + train/ActionL1Loss=0.0728 + throughput/total_tokens=1,905,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9928/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,906,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9929/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,906,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9930/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,906,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9931/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=1,906,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9932/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=1,906,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9933/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,907,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9934/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,907,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9935/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,907,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9936/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,907,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9937/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,907,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9938/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=1,908,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9939/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,908,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9940/500000] + optim/total_grad_norm=6.793 + train/ActionL1Loss=0.0370 + throughput/total_tokens=1,908,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9941/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,908,672,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9942/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,908,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9943/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,909,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9944/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,909,248,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9945/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,909,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9946/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=1,909,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9947/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,909,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9948/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=1,910,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9949/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,910,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9950/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,910,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9951/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,910,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9952/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,910,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9953/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,910,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9954/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,911,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9955/500000] + train/ActionL1Loss=0.0305 + throughput/total_tokens=1,911,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9956/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,911,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9957/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,911,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9958/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=1,911,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9959/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,912,128,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=9960/500000] + optim/total_grad_norm=7.777 + train/ActionL1Loss=0.0656 + throughput/total_tokens=1,912,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=9961/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,912,512,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9962/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,912,704,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9963/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,912,896,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9964/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,913,088,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9965/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=1,913,280,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=9966/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,913,472,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=9967/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,913,664,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9968/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=1,913,856,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9969/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,914,048,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=9970/500000] + train/ActionL1Loss=0.0279 + throughput/total_tokens=1,914,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=9971/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=1,914,432,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=9972/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=1,914,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9973/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,914,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9974/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,915,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9975/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,915,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9976/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,915,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9977/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,915,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9978/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,915,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=9979/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,915,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9980/500000] + optim/total_grad_norm=8.349 + train/ActionL1Loss=0.0554 + throughput/total_tokens=1,916,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=9981/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,916,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9982/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,916,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=9983/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=1,916,736,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9984/500000] + train/ActionL1Loss=0.0291 + throughput/total_tokens=1,916,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9985/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,917,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9986/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,917,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9987/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,917,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9988/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,917,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9989/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=1,917,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9990/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,918,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=9991/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,918,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=9992/500000] + train/ActionL1Loss=0.0285 + throughput/total_tokens=1,918,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9993/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,918,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=9994/500000] + train/ActionL1Loss=0.0271 + throughput/total_tokens=1,918,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9995/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,919,040,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9996/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,919,232,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9997/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=1,919,424,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9998/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=1,919,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=9999/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,919,808,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10000/500000] + optim/total_grad_norm=8.015 + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,920,000,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +10/14 [02:49:46] INFO | >> Saving config... checkpoint.py:608 +10/14 [02:50:29] INFO | >> Saving model state... checkpoint.py:796 +10/14 [02:51:41] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [02:53:13] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=10001/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=1,920,192,000 + throughput/device/tokens_per_second=1,208 + throughput/device/batches_per_second=0.0504 +[step=10002/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,920,384,000 + throughput/device/tokens_per_second=1,194 + throughput/device/batches_per_second=0.0498 +[step=10003/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=1,920,576,000 + throughput/device/tokens_per_second=1,191 + throughput/device/batches_per_second=0.0496 +[step=10004/500000] + train/ActionL1Loss=0.0284 + throughput/total_tokens=1,920,768,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0494 +[step=10005/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=1,920,960,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=10006/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,921,152,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=10007/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,921,344,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10008/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,921,536,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=10009/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,921,728,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=10010/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,921,920,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=10011/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,922,112,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=10012/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,922,304,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10013/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,922,496,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10014/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=1,922,688,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10015/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=1,922,880,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10016/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,923,072,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10017/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,923,264,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10018/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=1,923,456,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10019/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=1,923,648,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10020/500000] + optim/total_grad_norm=10.27 + train/ActionL1Loss=0.0493 + throughput/total_tokens=1,923,840,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10021/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,924,032,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10022/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,924,224,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10023/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,924,416,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10024/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,924,608,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10025/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,924,800,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10026/500000] + train/ActionL1Loss=0.0296 + throughput/total_tokens=1,924,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10027/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=1,925,184,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10028/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,925,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10029/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,925,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10030/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=1,925,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10031/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,925,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10032/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=1,926,144,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10033/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=1,926,336,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10034/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=1,926,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10035/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,926,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10036/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,926,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10037/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,927,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10038/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,927,296,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10039/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,927,488,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10040/500000] + optim/total_grad_norm=8.958 + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,927,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10041/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,927,872,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10042/500000] + train/ActionL1Loss=0.0605 + throughput/total_tokens=1,928,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10043/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=1,928,256,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10044/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,928,448,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10045/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,928,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10046/500000] + train/ActionL1Loss=0.0333 + throughput/total_tokens=1,928,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10047/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,929,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10048/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,929,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10049/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,929,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10050/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,929,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10051/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=1,929,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10052/500000] + train/ActionL1Loss=0.0245 + throughput/total_tokens=1,929,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10053/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=1,930,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10054/500000] + train/ActionL1Loss=0.0284 + throughput/total_tokens=1,930,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10055/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,930,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10056/500000] + train/ActionL1Loss=0.0297 + throughput/total_tokens=1,930,752,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10057/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,930,944,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10058/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,931,136,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10059/500000] + train/ActionL1Loss=0.0743 + throughput/total_tokens=1,931,328,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10060/500000] + optim/total_grad_norm=7.194 + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,931,520,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=10061/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=1,931,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10062/500000] + train/ActionL1Loss=0.0284 + throughput/total_tokens=1,931,904,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10063/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,932,096,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10064/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,932,288,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10065/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,932,480,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10066/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,932,672,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10067/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,932,864,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10068/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=1,933,056,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10069/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,933,248,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10070/500000] + train/ActionL1Loss=0.0345 + throughput/total_tokens=1,933,440,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10071/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,933,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10072/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=1,933,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10073/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,934,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10074/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,934,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10075/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,934,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10076/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,934,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10077/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,934,784,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10078/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,934,976,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10079/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,935,168,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10080/500000] + optim/total_grad_norm=7.917 + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,935,360,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10081/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,935,552,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10082/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,935,744,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10083/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=1,935,936,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10084/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,936,128,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10085/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=1,936,320,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10086/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=1,936,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10087/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,936,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10088/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=1,936,896,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10089/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,937,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10090/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=1,937,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10091/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=1,937,472,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10092/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,937,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10093/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=1,937,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10094/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,938,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10095/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,938,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10096/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,938,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10097/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,938,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10098/500000] + train/ActionL1Loss=0.0283 + throughput/total_tokens=1,938,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10099/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,939,008,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10100/500000] + optim/total_grad_norm=7.961 + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,939,200,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10101/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=1,939,392,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10102/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=1,939,584,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10103/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,939,776,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10104/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=1,939,968,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10105/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,940,160,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10106/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,940,352,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10107/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,940,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10108/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,940,736,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10109/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=1,940,928,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10110/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,941,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10111/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=1,941,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10112/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=1,941,504,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10113/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,941,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10114/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=1,941,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10115/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,942,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10116/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=1,942,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10117/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=1,942,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10118/500000] + train/ActionL1Loss=0.0300 + throughput/total_tokens=1,942,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10119/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,942,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10120/500000] + optim/total_grad_norm=8.291 + train/ActionL1Loss=0.0535 + throughput/total_tokens=1,943,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10121/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=1,943,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10122/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,943,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10123/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=1,943,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10124/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=1,943,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10125/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,944,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10126/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,944,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10127/500000] + train/ActionL1Loss=0.0281 + throughput/total_tokens=1,944,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10128/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,944,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10129/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,944,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10130/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=1,944,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10131/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,945,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10132/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,945,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10133/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=1,945,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10134/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,945,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10135/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=1,945,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10136/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=1,946,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10137/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=1,946,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10138/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,946,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10139/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,946,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10140/500000] + optim/total_grad_norm=6.497 + train/ActionL1Loss=0.0510 + throughput/total_tokens=1,946,880,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10141/500000] + train/ActionL1Loss=0.0275 + throughput/total_tokens=1,947,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10142/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,947,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10143/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=1,947,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10144/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=1,947,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10145/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,947,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10146/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,948,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10147/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,948,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10148/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,948,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10149/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,948,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10150/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,948,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10151/500000] + train/ActionL1Loss=0.0263 + throughput/total_tokens=1,948,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10152/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=1,949,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10153/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=1,949,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10154/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,949,568,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10155/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,949,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10156/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,949,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10157/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=1,950,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10158/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,950,336,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10159/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,950,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10160/500000] + optim/total_grad_norm=9.661 + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,950,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10161/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=1,950,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10162/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,951,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10163/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,951,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10164/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=1,951,488,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10165/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,951,680,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10166/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=1,951,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10167/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=1,952,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10168/500000] + train/ActionL1Loss=0.0270 + throughput/total_tokens=1,952,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10169/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=1,952,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10170/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=1,952,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10171/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,952,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10172/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,953,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10173/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,953,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10174/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=1,953,408,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10175/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=1,953,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10176/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,953,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10177/500000] + train/ActionL1Loss=0.0744 + throughput/total_tokens=1,953,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10178/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,954,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10179/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=1,954,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10180/500000] + optim/total_grad_norm=6.695 + train/ActionL1Loss=0.0322 + throughput/total_tokens=1,954,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10181/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,954,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10182/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,954,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10183/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=1,955,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10184/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,955,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10185/500000] + train/ActionL1Loss=0.0620 + throughput/total_tokens=1,955,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10186/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=1,955,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10187/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=1,955,904,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10188/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,956,096,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10189/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,956,288,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10190/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=1,956,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10191/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,956,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10192/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,956,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10193/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=1,957,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10194/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,957,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10195/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=1,957,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10196/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=1,957,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10197/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=1,957,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10198/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,958,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10199/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=1,958,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10200/500000] + optim/total_grad_norm=8.693 + train/ActionL1Loss=0.0581 + throughput/total_tokens=1,958,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10201/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,958,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10202/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=1,958,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10203/500000] + train/ActionL1Loss=0.0222 + throughput/total_tokens=1,958,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10204/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,959,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10205/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,959,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10206/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,959,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10207/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=1,959,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10208/500000] + train/ActionL1Loss=0.0202 + throughput/total_tokens=1,959,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10209/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=1,960,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10210/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=1,960,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=10211/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=1,960,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10212/500000] + train/ActionL1Loss=0.0251 + throughput/total_tokens=1,960,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10213/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=1,960,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10214/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,961,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10215/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=1,961,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10216/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,961,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10217/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=1,961,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10218/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,961,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10219/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,962,048,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10220/500000] + optim/total_grad_norm=8.882 + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,962,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10221/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,962,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10222/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=1,962,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10223/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,962,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10224/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=1,963,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10225/500000] + train/ActionL1Loss=0.0322 + throughput/total_tokens=1,963,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10226/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,963,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10227/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=1,963,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10228/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=1,963,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10229/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=1,963,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10230/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=1,964,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10231/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,964,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10232/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=1,964,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10233/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=1,964,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10234/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,964,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10235/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=1,965,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10236/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,965,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10237/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=1,965,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10238/500000] + train/ActionL1Loss=0.0633 + throughput/total_tokens=1,965,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10239/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=1,965,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10240/500000] + optim/total_grad_norm=8.109 + train/ActionL1Loss=0.0626 + throughput/total_tokens=1,966,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10241/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=1,966,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10242/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,966,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10243/500000] + train/ActionL1Loss=0.0566 + throughput/total_tokens=1,966,656,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10244/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=1,966,848,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10245/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=1,967,040,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10246/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,967,232,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10247/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=1,967,424,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10248/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=1,967,616,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10249/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,967,808,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10250/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=1,968,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10251/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,968,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10252/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,968,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10253/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=1,968,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10254/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=1,968,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10255/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=1,968,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10256/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=1,969,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10257/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=1,969,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10258/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,969,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10259/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,969,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10260/500000] + optim/total_grad_norm=5.669 + train/ActionL1Loss=0.0164 + throughput/total_tokens=1,969,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10261/500000] + train/ActionL1Loss=0.0242 + throughput/total_tokens=1,970,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10262/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,970,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10263/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=1,970,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10264/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,970,688,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10265/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=1,970,880,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10266/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=1,971,072,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10267/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,971,264,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10268/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=1,971,456,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10269/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=1,971,648,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10270/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,971,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10271/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=1,972,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10272/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,972,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10273/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=1,972,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10274/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,972,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10275/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,972,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10276/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,972,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10277/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=1,973,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10278/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,973,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10279/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,973,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10280/500000] + optim/total_grad_norm=4.759 + train/ActionL1Loss=0.0438 + throughput/total_tokens=1,973,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10281/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=1,973,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10282/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,974,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10283/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=1,974,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10284/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=1,974,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10285/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,974,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10286/500000] + train/ActionL1Loss=0.0257 + throughput/total_tokens=1,974,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10287/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=1,975,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10288/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,975,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10289/500000] + train/ActionL1Loss=0.0270 + throughput/total_tokens=1,975,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10290/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=1,975,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10291/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=1,975,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10292/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=1,976,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10293/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=1,976,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10294/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=1,976,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10295/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=1,976,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10296/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=1,976,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10297/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,977,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10298/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,977,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10299/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=1,977,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10300/500000] + optim/total_grad_norm=8.732 + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,977,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10301/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=1,977,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10302/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,977,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10303/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=1,978,176,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10304/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=1,978,368,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10305/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=1,978,560,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10306/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=1,978,752,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10307/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=1,978,944,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10308/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=1,979,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10309/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,979,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10310/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=1,979,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10311/500000] + train/ActionL1Loss=0.0301 + throughput/total_tokens=1,979,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10312/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=1,979,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10313/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,980,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10314/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=1,980,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10315/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,980,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10316/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,980,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10317/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=1,980,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10318/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=1,981,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10319/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=1,981,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10320/500000] + optim/total_grad_norm=8.129 + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,981,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10321/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=1,981,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10322/500000] + train/ActionL1Loss=0.0299 + throughput/total_tokens=1,981,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10323/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,982,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10324/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=1,982,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10325/500000] + train/ActionL1Loss=0.0626 + throughput/total_tokens=1,982,400,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10326/500000] + train/ActionL1Loss=0.0556 + throughput/total_tokens=1,982,592,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10327/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,982,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10328/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,982,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10329/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=1,983,168,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10330/500000] + train/ActionL1Loss=0.0657 + throughput/total_tokens=1,983,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10331/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=1,983,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10332/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,983,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10333/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,983,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10334/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=1,984,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10335/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=1,984,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10336/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=1,984,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10337/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,984,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10338/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=1,984,896,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10339/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=1,985,088,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10340/500000] + optim/total_grad_norm=8.757 + train/ActionL1Loss=0.0401 + throughput/total_tokens=1,985,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10341/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=1,985,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10342/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=1,985,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10343/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=1,985,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10344/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=1,986,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10345/500000] + train/ActionL1Loss=0.0322 + throughput/total_tokens=1,986,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10346/500000] + train/ActionL1Loss=0.0219 + throughput/total_tokens=1,986,432,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10347/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=1,986,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10348/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=1,986,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10349/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=1,987,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10350/500000] + train/ActionL1Loss=0.0670 + throughput/total_tokens=1,987,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10351/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,987,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10352/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,987,584,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10353/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=1,987,776,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10354/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=1,987,968,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10355/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=1,988,160,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10356/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=1,988,352,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10357/500000] + train/ActionL1Loss=0.0305 + throughput/total_tokens=1,988,544,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10358/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=1,988,736,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10359/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=1,988,928,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10360/500000] + optim/total_grad_norm=6.558 + train/ActionL1Loss=0.0404 + throughput/total_tokens=1,989,120,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=10361/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=1,989,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10362/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=1,989,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10363/500000] + train/ActionL1Loss=0.0564 + throughput/total_tokens=1,989,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10364/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,989,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10365/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=1,990,080,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10366/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=1,990,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10367/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=1,990,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10368/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=1,990,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10369/500000] + train/ActionL1Loss=0.0264 + throughput/total_tokens=1,990,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10370/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=1,991,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10371/500000] + train/ActionL1Loss=0.0304 + throughput/total_tokens=1,991,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10372/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=1,991,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10373/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=1,991,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10374/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=1,991,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10375/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=1,992,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10376/500000] + train/ActionL1Loss=0.0307 + throughput/total_tokens=1,992,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10377/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=1,992,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10378/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=1,992,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10379/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=1,992,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10380/500000] + optim/total_grad_norm=7.875 + train/ActionL1Loss=0.0502 + throughput/total_tokens=1,992,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10381/500000] + train/ActionL1Loss=0.0312 + throughput/total_tokens=1,993,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10382/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=1,993,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10383/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=1,993,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10384/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=1,993,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10385/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=1,993,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10386/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=1,994,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10387/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=1,994,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10388/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,994,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10389/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=1,994,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10390/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,994,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10391/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=1,995,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10392/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=1,995,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10393/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=1,995,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10394/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=1,995,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10395/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=1,995,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10396/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,996,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10397/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=1,996,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10398/500000] + train/ActionL1Loss=0.0327 + throughput/total_tokens=1,996,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10399/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=1,996,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10400/500000] + optim/total_grad_norm=8.811 + train/ActionL1Loss=0.0626 + throughput/total_tokens=1,996,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10401/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=1,996,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10402/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=1,997,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10403/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=1,997,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10404/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=1,997,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10405/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=1,997,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10406/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=1,997,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10407/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=1,998,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10408/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=1,998,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10409/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=1,998,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10410/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,998,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10411/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=1,998,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10412/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=1,999,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10413/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=1,999,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10414/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=1,999,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10415/500000] + train/ActionL1Loss=0.0599 + throughput/total_tokens=1,999,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10416/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=1,999,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10417/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,000,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10418/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=2,000,256,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10419/500000] + train/ActionL1Loss=0.0629 + throughput/total_tokens=2,000,448,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10420/500000] + optim/total_grad_norm=7.954 + train/ActionL1Loss=0.0528 + throughput/total_tokens=2,000,640,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10421/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=2,000,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10422/500000] + train/ActionL1Loss=0.0351 + throughput/total_tokens=2,001,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10423/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,001,216,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10424/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=2,001,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10425/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=2,001,600,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10426/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=2,001,792,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10427/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=2,001,984,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10428/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=2,002,176,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10429/500000] + train/ActionL1Loss=0.0630 + throughput/total_tokens=2,002,368,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10430/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=2,002,560,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=10431/500000] + train/ActionL1Loss=0.0530 + throughput/total_tokens=2,002,752,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10432/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=2,002,944,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10433/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=2,003,136,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10434/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=2,003,328,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10435/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,003,520,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10436/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=2,003,712,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10437/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,003,904,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10438/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=2,004,096,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10439/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=2,004,288,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10440/500000] + optim/total_grad_norm=8.872 + train/ActionL1Loss=0.0351 + throughput/total_tokens=2,004,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10441/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=2,004,672,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10442/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=2,004,864,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10443/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=2,005,056,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10444/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,005,248,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10445/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=2,005,440,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10446/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=2,005,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10447/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,005,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10448/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=2,006,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10449/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,006,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10450/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=2,006,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10451/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=2,006,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10452/500000] + train/ActionL1Loss=0.0268 + throughput/total_tokens=2,006,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10453/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,006,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10454/500000] + train/ActionL1Loss=0.0199 + throughput/total_tokens=2,007,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10455/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=2,007,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10456/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=2,007,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10457/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,007,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10458/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=2,007,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10459/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=2,008,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10460/500000] + optim/total_grad_norm=7.287 + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,008,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=10461/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,008,512,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10462/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=2,008,704,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10463/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=2,008,896,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10464/500000] + train/ActionL1Loss=0.0170 + throughput/total_tokens=2,009,088,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10465/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,009,280,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10466/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=2,009,472,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10467/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,009,664,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=10468/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,009,856,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=10469/500000] + train/ActionL1Loss=0.0333 + throughput/total_tokens=2,010,048,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10470/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=2,010,240,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10471/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=2,010,432,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10472/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=2,010,624,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10473/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=2,010,816,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10474/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=2,011,008,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10475/500000] + train/ActionL1Loss=0.0304 + throughput/total_tokens=2,011,200,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10476/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,011,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10477/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=2,011,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10478/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,011,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10479/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=2,011,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10480/500000] + optim/total_grad_norm=7.101 + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,012,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10481/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=2,012,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10482/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=2,012,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10483/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=2,012,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10484/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,012,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10485/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=2,013,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10486/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=2,013,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10487/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=2,013,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10488/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=2,013,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10489/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=2,013,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10490/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=2,014,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10491/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=2,014,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10492/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=2,014,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10493/500000] + train/ActionL1Loss=0.0695 + throughput/total_tokens=2,014,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10494/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=2,014,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10495/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,015,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10496/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=2,015,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10497/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=2,015,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10498/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,015,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10499/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=2,015,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10500/500000] + optim/total_grad_norm=7.670 + train/ActionL1Loss=0.0480 + throughput/total_tokens=2,016,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +10/14 [05:44:18] INFO | >> Saving config... checkpoint.py:608 +10/14 [05:45:04] INFO | >> Saving model state... checkpoint.py:796 +10/14 [05:46:16] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [05:47:50] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=10501/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=2,016,192,000 + throughput/device/tokens_per_second=1,207 + throughput/device/batches_per_second=0.0503 +[step=10502/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=2,016,384,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=10503/500000] + train/ActionL1Loss=0.0608 + throughput/total_tokens=2,016,576,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=10504/500000] + train/ActionL1Loss=0.0654 + throughput/total_tokens=2,016,768,000 + throughput/device/tokens_per_second=1,186 + throughput/device/batches_per_second=0.0494 +[step=10505/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,016,960,000 + throughput/device/tokens_per_second=1,185 + throughput/device/batches_per_second=0.0494 +[step=10506/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,017,152,000 + throughput/device/tokens_per_second=1,184 + throughput/device/batches_per_second=0.0493 +[step=10507/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=2,017,344,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=10508/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,017,536,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=10509/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=2,017,728,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10510/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=2,017,920,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=10511/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,018,112,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=10512/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=2,018,304,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 +[step=10513/500000] + train/ActionL1Loss=0.0241 + throughput/total_tokens=2,018,496,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10514/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=2,018,688,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10515/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=2,018,880,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10516/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=2,019,072,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10517/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,019,264,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10518/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,019,456,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10519/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=2,019,648,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10520/500000] + optim/total_grad_norm=7.406 + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,019,840,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10521/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=2,020,032,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10522/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=2,020,224,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10523/500000] + train/ActionL1Loss=0.0258 + throughput/total_tokens=2,020,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10524/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,020,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10525/500000] + train/ActionL1Loss=0.0656 + throughput/total_tokens=2,020,800,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10526/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=2,020,992,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10527/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,021,184,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10528/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=2,021,376,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10529/500000] + train/ActionL1Loss=0.0229 + throughput/total_tokens=2,021,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10530/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=2,021,760,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10531/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=2,021,952,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10532/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=2,022,144,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10533/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,022,336,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10534/500000] + train/ActionL1Loss=0.0625 + throughput/total_tokens=2,022,528,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10535/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=2,022,720,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10536/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=2,022,912,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10537/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=2,023,104,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10538/500000] + train/ActionL1Loss=0.0351 + throughput/total_tokens=2,023,296,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10539/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=2,023,488,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10540/500000] + optim/total_grad_norm=9.250 + train/ActionL1Loss=0.0494 + throughput/total_tokens=2,023,680,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=10541/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=2,023,872,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10542/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=2,024,064,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10543/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=2,024,256,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10544/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=2,024,448,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10545/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,024,640,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10546/500000] + train/ActionL1Loss=0.0333 + throughput/total_tokens=2,024,832,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10547/500000] + train/ActionL1Loss=0.0292 + throughput/total_tokens=2,025,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10548/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=2,025,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10549/500000] + train/ActionL1Loss=0.0616 + throughput/total_tokens=2,025,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10550/500000] + train/ActionL1Loss=0.0318 + throughput/total_tokens=2,025,600,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10551/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=2,025,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10552/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=2,025,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10553/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=2,026,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10554/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=2,026,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10555/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,026,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10556/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=2,026,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10557/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=2,026,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10558/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=2,027,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10559/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=2,027,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10560/500000] + optim/total_grad_norm=7.474 + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,027,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10561/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=2,027,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10562/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=2,027,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10563/500000] + train/ActionL1Loss=0.0232 + throughput/total_tokens=2,028,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10564/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=2,028,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10565/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=2,028,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10566/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=2,028,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10567/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=2,028,864,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10568/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=2,029,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10569/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=2,029,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10570/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=2,029,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10571/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=2,029,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10572/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=2,029,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10573/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=2,030,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10574/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=2,030,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10575/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=2,030,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10576/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,030,592,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10577/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=2,030,784,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10578/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=2,030,976,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10579/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=2,031,168,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10580/500000] + optim/total_grad_norm=8.462 + train/ActionL1Loss=0.0321 + throughput/total_tokens=2,031,360,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10581/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,031,552,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10582/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,031,744,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10583/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,031,936,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10584/500000] + train/ActionL1Loss=0.0623 + throughput/total_tokens=2,032,128,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10585/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=2,032,320,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10586/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=2,032,512,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10587/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=2,032,704,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10588/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,032,896,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10589/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=2,033,088,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10590/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,033,280,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=10591/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=2,033,472,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10592/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,033,664,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10593/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=2,033,856,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10594/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,034,048,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10595/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=2,034,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10596/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=2,034,432,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10597/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,034,624,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10598/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,034,816,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10599/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=2,035,008,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=10600/500000] + optim/total_grad_norm=10.06 + train/ActionL1Loss=0.0353 + throughput/total_tokens=2,035,200,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=10601/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,035,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10602/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=2,035,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10603/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=2,035,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10604/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=2,035,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10605/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,036,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10606/500000] + train/ActionL1Loss=0.0285 + throughput/total_tokens=2,036,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10607/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,036,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10608/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=2,036,736,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10609/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=2,036,928,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10610/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,037,120,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=10611/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=2,037,312,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10612/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=2,037,504,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10613/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=2,037,696,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10614/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,037,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10615/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,038,080,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10616/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=2,038,272,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10617/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=2,038,464,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10618/500000] + train/ActionL1Loss=0.0584 + throughput/total_tokens=2,038,656,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10619/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=2,038,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10620/500000] + optim/total_grad_norm=8.035 + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,039,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10621/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=2,039,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10622/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,039,424,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10623/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=2,039,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10624/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=2,039,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10625/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=2,040,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10626/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,040,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10627/500000] + train/ActionL1Loss=0.0606 + throughput/total_tokens=2,040,384,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10628/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=2,040,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10629/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=2,040,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10630/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=2,040,960,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10631/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=2,041,152,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10632/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,041,344,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10633/500000] + train/ActionL1Loss=0.0307 + throughput/total_tokens=2,041,536,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10634/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=2,041,728,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10635/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,041,920,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10636/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=2,042,112,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10637/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,042,304,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10638/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=2,042,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10639/500000] + train/ActionL1Loss=0.0276 + throughput/total_tokens=2,042,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10640/500000] + optim/total_grad_norm=7.663 + train/ActionL1Loss=0.0558 + throughput/total_tokens=2,042,880,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10641/500000] + train/ActionL1Loss=0.0267 + throughput/total_tokens=2,043,072,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10642/500000] + train/ActionL1Loss=0.0174 + throughput/total_tokens=2,043,264,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10643/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,043,456,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10644/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=2,043,648,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10645/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=2,043,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10646/500000] + train/ActionL1Loss=0.0259 + throughput/total_tokens=2,044,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10647/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=2,044,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10648/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=2,044,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10649/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,044,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10650/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=2,044,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10651/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=2,044,992,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10652/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,045,184,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10653/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=2,045,376,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10654/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=2,045,568,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10655/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=2,045,760,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=10656/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=2,045,952,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=10657/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=2,046,144,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=10658/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=2,046,336,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10659/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=2,046,528,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10660/500000] + optim/total_grad_norm=8.751 + train/ActionL1Loss=0.0336 + throughput/total_tokens=2,046,720,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=10661/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=2,046,912,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10662/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=2,047,104,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10663/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=2,047,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10664/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=2,047,488,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10665/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,047,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10666/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=2,047,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10667/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=2,048,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10668/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=2,048,256,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10669/500000] + train/ActionL1Loss=0.0265 + throughput/total_tokens=2,048,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10670/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=2,048,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10671/500000] + train/ActionL1Loss=0.0286 + throughput/total_tokens=2,048,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10672/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=2,049,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10673/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=2,049,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10674/500000] + train/ActionL1Loss=0.0598 + throughput/total_tokens=2,049,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10675/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=2,049,600,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10676/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=2,049,792,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10677/500000] + train/ActionL1Loss=0.0581 + throughput/total_tokens=2,049,984,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10678/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=2,050,176,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10679/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=2,050,368,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10680/500000] + optim/total_grad_norm=7.457 + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,050,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10681/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=2,050,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10682/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,050,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10683/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=2,051,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10684/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=2,051,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10685/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=2,051,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10686/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=2,051,712,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10687/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=2,051,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10688/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,052,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10689/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=2,052,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10690/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=2,052,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10691/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=2,052,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10692/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,052,864,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10693/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=2,053,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10694/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,053,248,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10695/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=2,053,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10696/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=2,053,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10697/500000] + train/ActionL1Loss=0.0301 + throughput/total_tokens=2,053,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10698/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=2,054,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10699/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=2,054,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10700/500000] + optim/total_grad_norm=10.58 + train/ActionL1Loss=0.0590 + throughput/total_tokens=2,054,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10701/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=2,054,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10702/500000] + train/ActionL1Loss=0.0666 + throughput/total_tokens=2,054,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10703/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=2,054,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10704/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=2,055,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10705/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=2,055,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10706/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,055,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10707/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=2,055,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10708/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=2,055,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10709/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,056,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10710/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=2,056,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10711/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,056,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10712/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=2,056,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10713/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,056,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10714/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,057,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10715/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,057,280,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10716/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,057,472,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10717/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=2,057,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10718/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=2,057,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10719/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=2,058,048,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10720/500000] + optim/total_grad_norm=9.949 + train/ActionL1Loss=0.0623 + throughput/total_tokens=2,058,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10721/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=2,058,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10722/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,058,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10723/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=2,058,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10724/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,059,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10725/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=2,059,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10726/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=2,059,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10727/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=2,059,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10728/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=2,059,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10729/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=2,059,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10730/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,060,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10731/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=2,060,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10732/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,060,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10733/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=2,060,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10734/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=2,060,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10735/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=2,061,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10736/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=2,061,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10737/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=2,061,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10738/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=2,061,696,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10739/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,061,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10740/500000] + optim/total_grad_norm=8.208 + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,062,080,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10741/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,062,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10742/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=2,062,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10743/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=2,062,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10744/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=2,062,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10745/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=2,063,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10746/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,063,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10747/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=2,063,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10748/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=2,063,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10749/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=2,063,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10750/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=2,064,000,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10751/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=2,064,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10752/500000] + train/ActionL1Loss=0.0296 + throughput/total_tokens=2,064,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10753/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,064,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10754/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=2,064,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10755/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=2,064,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10756/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=2,065,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10757/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=2,065,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10758/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=2,065,536,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10759/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=2,065,728,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10760/500000] + optim/total_grad_norm=8.273 + train/ActionL1Loss=0.0515 + throughput/total_tokens=2,065,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10761/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=2,066,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10762/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=2,066,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10763/500000] + train/ActionL1Loss=0.0281 + throughput/total_tokens=2,066,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10764/500000] + train/ActionL1Loss=0.0305 + throughput/total_tokens=2,066,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10765/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,066,880,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10766/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=2,067,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10767/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=2,067,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10768/500000] + train/ActionL1Loss=0.0639 + throughput/total_tokens=2,067,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10769/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,067,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10770/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=2,067,840,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10771/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=2,068,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10772/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=2,068,224,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10773/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=2,068,416,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10774/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=2,068,608,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10775/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,068,800,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10776/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=2,068,992,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10777/500000] + train/ActionL1Loss=0.0260 + throughput/total_tokens=2,069,184,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10778/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=2,069,376,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10779/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=2,069,568,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10780/500000] + optim/total_grad_norm=9.962 + train/ActionL1Loss=0.0317 + throughput/total_tokens=2,069,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10781/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=2,069,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10782/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,070,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10783/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=2,070,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10784/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,070,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10785/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=2,070,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10786/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=2,070,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10787/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=2,071,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10788/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,071,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10789/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,071,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10790/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=2,071,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10791/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=2,071,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10792/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=2,072,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10793/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=2,072,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10794/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=2,072,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10795/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=2,072,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10796/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,072,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10797/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=2,073,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10798/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=2,073,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10799/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=2,073,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10800/500000] + optim/total_grad_norm=6.678 + train/ActionL1Loss=0.0429 + throughput/total_tokens=2,073,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10801/500000] + train/ActionL1Loss=0.0651 + throughput/total_tokens=2,073,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10802/500000] + train/ActionL1Loss=0.0242 + throughput/total_tokens=2,073,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10803/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=2,074,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10804/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=2,074,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10805/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=2,074,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10806/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,074,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10807/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=2,074,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10808/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=2,075,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10809/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=2,075,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10810/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=2,075,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10811/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=2,075,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10812/500000] + train/ActionL1Loss=0.0277 + throughput/total_tokens=2,075,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10813/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=2,076,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10814/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=2,076,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10815/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=2,076,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10816/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=2,076,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10817/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=2,076,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10818/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=2,077,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10819/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=2,077,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10820/500000] + optim/total_grad_norm=8.815 + train/ActionL1Loss=0.0553 + throughput/total_tokens=2,077,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10821/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=2,077,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10822/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=2,077,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10823/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,078,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10824/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,078,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10825/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=2,078,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10826/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=2,078,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10827/500000] + train/ActionL1Loss=0.0601 + throughput/total_tokens=2,078,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10828/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=2,078,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10829/500000] + train/ActionL1Loss=0.0265 + throughput/total_tokens=2,079,168,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10830/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=2,079,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10831/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,079,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10832/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=2,079,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10833/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,079,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10834/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,080,128,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10835/500000] + train/ActionL1Loss=0.0669 + throughput/total_tokens=2,080,320,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10836/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=2,080,512,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10837/500000] + train/ActionL1Loss=0.0678 + throughput/total_tokens=2,080,704,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10838/500000] + train/ActionL1Loss=0.0293 + throughput/total_tokens=2,080,896,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10839/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=2,081,088,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10840/500000] + optim/total_grad_norm=7.830 + train/ActionL1Loss=0.0575 + throughput/total_tokens=2,081,280,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10841/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=2,081,472,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10842/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=2,081,664,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10843/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=2,081,856,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10844/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=2,082,048,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10845/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,082,240,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10846/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=2,082,432,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10847/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=2,082,624,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10848/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=2,082,816,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10849/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,083,008,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10850/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=2,083,200,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10851/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=2,083,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10852/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=2,083,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10853/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,083,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10854/500000] + train/ActionL1Loss=0.0285 + throughput/total_tokens=2,083,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10855/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=2,084,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10856/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=2,084,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10857/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=2,084,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10858/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,084,736,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10859/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=2,084,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10860/500000] + optim/total_grad_norm=7.763 + train/ActionL1Loss=0.0448 + throughput/total_tokens=2,085,120,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10861/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,085,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10862/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,085,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10863/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=2,085,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10864/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,085,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10865/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=2,086,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10866/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,086,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10867/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=2,086,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10868/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=2,086,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10869/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=2,086,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10870/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=2,087,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10871/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,087,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10872/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=2,087,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10873/500000] + train/ActionL1Loss=0.0619 + throughput/total_tokens=2,087,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10874/500000] + train/ActionL1Loss=0.0329 + throughput/total_tokens=2,087,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10875/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,088,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10876/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=2,088,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10877/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=2,088,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10878/500000] + train/ActionL1Loss=0.0207 + throughput/total_tokens=2,088,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10879/500000] + train/ActionL1Loss=0.0308 + throughput/total_tokens=2,088,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10880/500000] + optim/total_grad_norm=9.134 + train/ActionL1Loss=0.0229 + throughput/total_tokens=2,088,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10881/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=2,089,152,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10882/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,089,344,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10883/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=2,089,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10884/500000] + train/ActionL1Loss=0.0301 + throughput/total_tokens=2,089,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10885/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,089,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10886/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,090,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10887/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,090,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10888/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=2,090,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10889/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=2,090,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10890/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,090,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10891/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,091,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10892/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,091,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10893/500000] + train/ActionL1Loss=0.0300 + throughput/total_tokens=2,091,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10894/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=2,091,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10895/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=2,091,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10896/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,092,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10897/500000] + train/ActionL1Loss=0.0284 + throughput/total_tokens=2,092,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10898/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,092,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10899/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=2,092,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10900/500000] + optim/total_grad_norm=8.212 + train/ActionL1Loss=0.0393 + throughput/total_tokens=2,092,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10901/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,092,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10902/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=2,093,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10903/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=2,093,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10904/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=2,093,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10905/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=2,093,760,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=10906/500000] + train/ActionL1Loss=0.0292 + throughput/total_tokens=2,093,952,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10907/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,094,144,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10908/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,094,336,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10909/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=2,094,528,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10910/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=2,094,720,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=10911/500000] + train/ActionL1Loss=0.0377 + throughput/total_tokens=2,094,912,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10912/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=2,095,104,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10913/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=2,095,296,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10914/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=2,095,488,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10915/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,095,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10916/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,095,872,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10917/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=2,096,064,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10918/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=2,096,256,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10919/500000] + train/ActionL1Loss=0.0260 + throughput/total_tokens=2,096,448,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=10920/500000] + optim/total_grad_norm=6.412 + train/ActionL1Loss=0.0394 + throughput/total_tokens=2,096,640,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10921/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,096,832,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10922/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=2,097,024,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10923/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=2,097,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10924/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=2,097,408,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10925/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,097,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10926/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,097,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=10927/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,097,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10928/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=2,098,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10929/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=2,098,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=10930/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=2,098,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10931/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=2,098,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10932/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=2,098,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10933/500000] + train/ActionL1Loss=0.0275 + throughput/total_tokens=2,099,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10934/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=2,099,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10935/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=2,099,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10936/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=2,099,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10937/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=2,099,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10938/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=2,100,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10939/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=2,100,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10940/500000] + optim/total_grad_norm=8.876 + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,100,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10941/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=2,100,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10942/500000] + train/ActionL1Loss=0.0333 + throughput/total_tokens=2,100,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10943/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=2,101,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10944/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=2,101,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10945/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,101,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10946/500000] + train/ActionL1Loss=0.0661 + throughput/total_tokens=2,101,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10947/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=2,101,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10948/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=2,102,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10949/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=2,102,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=10950/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,102,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10951/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=2,102,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10952/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=2,102,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10953/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,102,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10954/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=2,103,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10955/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=2,103,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10956/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,103,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10957/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,103,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=10958/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,103,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10959/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,104,128,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10960/500000] + optim/total_grad_norm=7.206 + train/ActionL1Loss=0.0394 + throughput/total_tokens=2,104,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=10961/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=2,104,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10962/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,104,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10963/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=2,104,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10964/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=2,105,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10965/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,105,280,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=10966/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,105,472,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10967/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=2,105,664,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10968/500000] + train/ActionL1Loss=0.0284 + throughput/total_tokens=2,105,856,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10969/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=2,106,048,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=10970/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,106,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=10971/500000] + train/ActionL1Loss=0.0245 + throughput/total_tokens=2,106,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10972/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=2,106,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10973/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=2,106,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10974/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,107,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10975/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,107,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10976/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=2,107,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10977/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,107,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10978/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=2,107,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10979/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=2,107,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10980/500000] + optim/total_grad_norm=8.689 + train/ActionL1Loss=0.0495 + throughput/total_tokens=2,108,160,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10981/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=2,108,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10982/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=2,108,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10983/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,108,736,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=10984/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=2,108,928,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10985/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=2,109,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10986/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,109,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10987/500000] + train/ActionL1Loss=0.0171 + throughput/total_tokens=2,109,504,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10988/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,109,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10989/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=2,109,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10990/500000] + train/ActionL1Loss=0.0514 + throughput/total_tokens=2,110,080,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=10991/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=2,110,272,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=10992/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=2,110,464,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10993/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=2,110,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10994/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=2,110,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=10995/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=2,111,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10996/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,111,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10997/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=2,111,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10998/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=2,111,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=10999/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,111,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11000/500000] + optim/total_grad_norm=8.413 + train/ActionL1Loss=0.0374 + throughput/total_tokens=2,112,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/14 [08:38:56] INFO | >> Saving config... checkpoint.py:608 +10/14 [08:39:39] INFO | >> Saving model state... checkpoint.py:796 +10/14 [08:40:50] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [08:42:22] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=11001/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,112,192,000 + throughput/device/tokens_per_second=1,210 + throughput/device/batches_per_second=0.0504 +[step=11002/500000] + train/ActionL1Loss=0.0286 + throughput/total_tokens=2,112,384,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11003/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,112,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11004/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,112,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11005/500000] + train/ActionL1Loss=0.0536 + throughput/total_tokens=2,112,960,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11006/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,113,152,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11007/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=2,113,344,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11008/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=2,113,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11009/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=2,113,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11010/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=2,113,920,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11011/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,114,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11012/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,114,304,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11013/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=2,114,496,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11014/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=2,114,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11015/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=2,114,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11016/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=2,115,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11017/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,115,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11018/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,115,456,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11019/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,115,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11020/500000] + optim/total_grad_norm=6.544 + train/ActionL1Loss=0.0389 + throughput/total_tokens=2,115,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11021/500000] + train/ActionL1Loss=0.0431 + throughput/total_tokens=2,116,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11022/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=2,116,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11023/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=2,116,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11024/500000] + train/ActionL1Loss=0.0246 + throughput/total_tokens=2,116,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11025/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=2,116,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11026/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,116,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11027/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=2,117,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11028/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=2,117,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11029/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=2,117,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11030/500000] + train/ActionL1Loss=0.0296 + throughput/total_tokens=2,117,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11031/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,117,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11032/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=2,118,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11033/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=2,118,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11034/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,118,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11035/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,118,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11036/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=2,118,912,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11037/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=2,119,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11038/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=2,119,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11039/500000] + train/ActionL1Loss=0.0310 + throughput/total_tokens=2,119,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11040/500000] + optim/total_grad_norm=7.718 + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,119,680,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11041/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,119,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11042/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=2,120,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11043/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=2,120,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11044/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=2,120,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11045/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=2,120,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11046/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=2,120,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11047/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=2,121,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11048/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,121,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11049/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=2,121,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11050/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,121,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11051/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,121,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11052/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=2,121,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11053/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=2,122,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11054/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=2,122,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11055/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,122,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11056/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=2,122,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11057/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,122,944,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11058/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=2,123,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11059/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=2,123,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11060/500000] + optim/total_grad_norm=5.623 + train/ActionL1Loss=0.0348 + throughput/total_tokens=2,123,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11061/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,123,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11062/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,123,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11063/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=2,124,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11064/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=2,124,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11065/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=2,124,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11066/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=2,124,672,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11067/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=2,124,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11068/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=2,125,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11069/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=2,125,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11070/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=2,125,440,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11071/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=2,125,632,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11072/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=2,125,824,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11073/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=2,126,016,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11074/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=2,126,208,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11075/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,126,400,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11076/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=2,126,592,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11077/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=2,126,784,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11078/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=2,126,976,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11079/500000] + train/ActionL1Loss=0.0281 + throughput/total_tokens=2,127,168,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11080/500000] + optim/total_grad_norm=7.693 + train/ActionL1Loss=0.0450 + throughput/total_tokens=2,127,360,000 + throughput/device/tokens_per_second=1,183 + throughput/device/batches_per_second=0.0493 + System/Peak GPU Memory (MB)=46,924 +[step=11081/500000] + train/ActionL1Loss=0.0243 + throughput/total_tokens=2,127,552,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11082/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=2,127,744,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11083/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=2,127,936,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=11084/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=2,128,128,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11085/500000] + train/ActionL1Loss=0.0278 + throughput/total_tokens=2,128,320,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11086/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,128,512,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11087/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,128,704,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11088/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=2,128,896,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11089/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=2,129,088,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11090/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=2,129,280,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11091/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=2,129,472,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11092/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=2,129,664,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11093/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,129,856,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11094/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=2,130,048,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11095/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=2,130,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11096/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=2,130,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11097/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=2,130,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11098/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=2,130,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11099/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,131,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11100/500000] + optim/total_grad_norm=7.712 + train/ActionL1Loss=0.0510 + throughput/total_tokens=2,131,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11101/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=2,131,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11102/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,131,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11103/500000] + train/ActionL1Loss=0.0301 + throughput/total_tokens=2,131,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11104/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,131,968,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11105/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=2,132,160,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11106/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,132,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11107/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=2,132,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11108/500000] + train/ActionL1Loss=0.0318 + throughput/total_tokens=2,132,736,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11109/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,132,928,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11110/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=2,133,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11111/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=2,133,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11112/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=2,133,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11113/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=2,133,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11114/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,133,888,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11115/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,134,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11116/500000] + train/ActionL1Loss=0.0285 + throughput/total_tokens=2,134,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11117/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,134,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11118/500000] + train/ActionL1Loss=0.0583 + throughput/total_tokens=2,134,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11119/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,134,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11120/500000] + optim/total_grad_norm=6.555 + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,135,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11121/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=2,135,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11122/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,135,424,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11123/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=2,135,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11124/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=2,135,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11125/500000] + train/ActionL1Loss=0.0242 + throughput/total_tokens=2,136,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11126/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=2,136,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11127/500000] + train/ActionL1Loss=0.0318 + throughput/total_tokens=2,136,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11128/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,136,576,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11129/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=2,136,768,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11130/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=2,136,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11131/500000] + train/ActionL1Loss=0.0551 + throughput/total_tokens=2,137,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11132/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,137,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11133/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=2,137,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11134/500000] + train/ActionL1Loss=0.0278 + throughput/total_tokens=2,137,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11135/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=2,137,920,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11136/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,138,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11137/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=2,138,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11138/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=2,138,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11139/500000] + train/ActionL1Loss=0.0748 + throughput/total_tokens=2,138,688,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11140/500000] + optim/total_grad_norm=9.141 + train/ActionL1Loss=0.0537 + throughput/total_tokens=2,138,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11141/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,139,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11142/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=2,139,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11143/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=2,139,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11144/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=2,139,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11145/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=2,139,840,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11146/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=2,140,032,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11147/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,140,224,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11148/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,140,416,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11149/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=2,140,608,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11150/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=2,140,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11151/500000] + train/ActionL1Loss=0.0568 + throughput/total_tokens=2,140,992,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11152/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=2,141,184,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11153/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=2,141,376,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11154/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,141,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11155/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=2,141,760,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11156/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=2,141,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11157/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=2,142,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11158/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=2,142,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11159/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=2,142,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11160/500000] + optim/total_grad_norm=8.441 + train/ActionL1Loss=0.0409 + throughput/total_tokens=2,142,720,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11161/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=2,142,912,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11162/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,143,104,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11163/500000] + train/ActionL1Loss=0.0253 + throughput/total_tokens=2,143,296,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11164/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=2,143,488,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11165/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,143,680,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11166/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,143,872,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=11167/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,144,064,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=11168/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=2,144,256,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0488 +[step=11169/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=2,144,448,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=11170/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=2,144,640,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11171/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,144,832,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11172/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=2,145,024,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11173/500000] + train/ActionL1Loss=0.0595 + throughput/total_tokens=2,145,216,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11174/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=2,145,408,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11175/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=2,145,600,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11176/500000] + train/ActionL1Loss=0.0232 + throughput/total_tokens=2,145,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11177/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=2,145,984,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11178/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=2,146,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11179/500000] + train/ActionL1Loss=0.0272 + throughput/total_tokens=2,146,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11180/500000] + optim/total_grad_norm=7.699 + train/ActionL1Loss=0.0350 + throughput/total_tokens=2,146,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11181/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=2,146,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11182/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=2,146,944,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11183/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=2,147,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11184/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=2,147,328,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11185/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=2,147,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11186/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=2,147,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11187/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=2,147,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11188/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=2,148,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11189/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,148,288,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11190/500000] + train/ActionL1Loss=0.0549 + throughput/total_tokens=2,148,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11191/500000] + train/ActionL1Loss=0.0458 + throughput/total_tokens=2,148,672,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11192/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=2,148,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11193/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=2,149,056,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11194/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=2,149,248,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11195/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,149,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11196/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=2,149,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11197/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=2,149,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11198/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=2,150,016,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11199/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=2,150,208,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11200/500000] + optim/total_grad_norm=7.729 + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,150,400,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11201/500000] + train/ActionL1Loss=0.0281 + throughput/total_tokens=2,150,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11202/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=2,150,784,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11203/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=2,150,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11204/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=2,151,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11205/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,151,360,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11206/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=2,151,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11207/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,151,744,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11208/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=2,151,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11209/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,152,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11210/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=2,152,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11211/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=2,152,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11212/500000] + train/ActionL1Loss=0.0260 + throughput/total_tokens=2,152,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11213/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,152,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11214/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=2,153,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11215/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=2,153,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11216/500000] + train/ActionL1Loss=0.0588 + throughput/total_tokens=2,153,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11217/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=2,153,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11218/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,153,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11219/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=2,154,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11220/500000] + optim/total_grad_norm=9.068 + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,154,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11221/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=2,154,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11222/500000] + train/ActionL1Loss=0.0597 + throughput/total_tokens=2,154,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11223/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,154,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11224/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,155,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11225/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=2,155,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11226/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,155,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11227/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=2,155,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11228/500000] + train/ActionL1Loss=0.0563 + throughput/total_tokens=2,155,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11229/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=2,155,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11230/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=2,156,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11231/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=2,156,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11232/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=2,156,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11233/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,156,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11234/500000] + train/ActionL1Loss=0.0665 + throughput/total_tokens=2,156,928,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11235/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=2,157,120,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11236/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=2,157,312,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11237/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=2,157,504,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11238/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=2,157,696,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11239/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=2,157,888,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11240/500000] + optim/total_grad_norm=7.546 + train/ActionL1Loss=0.0482 + throughput/total_tokens=2,158,080,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11241/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=2,158,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11242/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=2,158,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11243/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=2,158,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11244/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=2,158,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11245/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=2,159,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11246/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=2,159,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11247/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=2,159,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11248/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,159,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11249/500000] + train/ActionL1Loss=0.0276 + throughput/total_tokens=2,159,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11250/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,160,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11251/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=2,160,192,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11252/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=2,160,384,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11253/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=2,160,576,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11254/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=2,160,768,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11255/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=2,160,960,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11256/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=2,161,152,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11257/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=2,161,344,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11258/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=2,161,536,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11259/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=2,161,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11260/500000] + optim/total_grad_norm=7.180 + train/ActionL1Loss=0.0344 + throughput/total_tokens=2,161,920,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11261/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=2,162,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11262/500000] + train/ActionL1Loss=0.0318 + throughput/total_tokens=2,162,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11263/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=2,162,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11264/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=2,162,688,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11265/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=2,162,880,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11266/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,163,072,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11267/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,163,264,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11268/500000] + train/ActionL1Loss=0.0573 + throughput/total_tokens=2,163,456,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11269/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=2,163,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11270/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=2,163,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11271/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,164,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11272/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,164,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11273/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=2,164,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11274/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=2,164,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11275/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,164,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11276/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=2,164,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11277/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=2,165,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11278/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=2,165,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11279/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,165,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11280/500000] + optim/total_grad_norm=8.724 + train/ActionL1Loss=0.0517 + throughput/total_tokens=2,165,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11281/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,165,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11282/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=2,166,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11283/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,166,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11284/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=2,166,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11285/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=2,166,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11286/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,166,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11287/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=2,167,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11288/500000] + train/ActionL1Loss=0.0557 + throughput/total_tokens=2,167,296,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11289/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=2,167,488,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11290/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,167,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11291/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=2,167,872,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11292/500000] + train/ActionL1Loss=0.0562 + throughput/total_tokens=2,168,064,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11293/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=2,168,256,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11294/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,168,448,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11295/500000] + train/ActionL1Loss=0.0319 + throughput/total_tokens=2,168,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11296/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=2,168,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11297/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=2,169,024,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11298/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,169,216,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11299/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=2,169,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11300/500000] + optim/total_grad_norm=8.691 + train/ActionL1Loss=0.0480 + throughput/total_tokens=2,169,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11301/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=2,169,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11302/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=2,169,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11303/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=2,170,176,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11304/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,170,368,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11305/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=2,170,560,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11306/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=2,170,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11307/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,170,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11308/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=2,171,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11309/500000] + train/ActionL1Loss=0.0282 + throughput/total_tokens=2,171,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11310/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=2,171,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11311/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,171,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11312/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,171,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11313/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=2,172,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11314/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=2,172,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11315/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=2,172,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11316/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,172,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11317/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=2,172,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11318/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,173,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11319/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=2,173,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11320/500000] + optim/total_grad_norm=8.054 + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,173,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11321/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=2,173,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11322/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=2,173,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11323/500000] + train/ActionL1Loss=0.0270 + throughput/total_tokens=2,174,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11324/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,174,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11325/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,174,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11326/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=2,174,592,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11327/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=2,174,784,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11328/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=2,174,976,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11329/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=2,175,168,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11330/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=2,175,360,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11331/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,175,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11332/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=2,175,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11333/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=2,175,936,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11334/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=2,176,128,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11335/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=2,176,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11336/500000] + train/ActionL1Loss=0.0268 + throughput/total_tokens=2,176,512,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11337/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=2,176,704,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11338/500000] + train/ActionL1Loss=0.0282 + throughput/total_tokens=2,176,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11339/500000] + train/ActionL1Loss=0.0255 + throughput/total_tokens=2,177,088,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11340/500000] + optim/total_grad_norm=8.750 + train/ActionL1Loss=0.0369 + throughput/total_tokens=2,177,280,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11341/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=2,177,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11342/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=2,177,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11343/500000] + train/ActionL1Loss=0.0552 + throughput/total_tokens=2,177,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11344/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,178,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11345/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=2,178,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11346/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=2,178,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11347/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=2,178,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11348/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,178,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11349/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=2,179,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11350/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=2,179,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11351/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=2,179,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11352/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=2,179,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11353/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=2,179,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11354/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=2,179,968,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11355/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,180,160,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11356/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,180,352,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11357/500000] + train/ActionL1Loss=0.0301 + throughput/total_tokens=2,180,544,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11358/500000] + train/ActionL1Loss=0.0227 + throughput/total_tokens=2,180,736,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11359/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,180,928,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11360/500000] + optim/total_grad_norm=7.486 + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,181,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11361/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=2,181,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11362/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=2,181,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11363/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=2,181,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11364/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=2,181,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11365/500000] + train/ActionL1Loss=0.0613 + throughput/total_tokens=2,182,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11366/500000] + train/ActionL1Loss=0.0590 + throughput/total_tokens=2,182,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11367/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=2,182,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11368/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=2,182,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11369/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=2,182,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11370/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=2,183,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11371/500000] + train/ActionL1Loss=0.0586 + throughput/total_tokens=2,183,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11372/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=2,183,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11373/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=2,183,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11374/500000] + train/ActionL1Loss=0.0237 + throughput/total_tokens=2,183,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11375/500000] + train/ActionL1Loss=0.0223 + throughput/total_tokens=2,184,000,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11376/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=2,184,192,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11377/500000] + train/ActionL1Loss=0.0289 + throughput/total_tokens=2,184,384,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11378/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,184,576,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11379/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,184,768,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11380/500000] + optim/total_grad_norm=8.511 + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,184,960,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11381/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,185,152,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11382/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=2,185,344,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11383/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,185,536,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11384/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=2,185,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11385/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=2,185,920,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11386/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,186,112,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11387/500000] + train/ActionL1Loss=0.0664 + throughput/total_tokens=2,186,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11388/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=2,186,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11389/500000] + train/ActionL1Loss=0.0594 + throughput/total_tokens=2,186,688,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11390/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=2,186,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11391/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=2,187,072,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11392/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=2,187,264,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11393/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=2,187,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11394/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=2,187,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11395/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,187,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11396/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,188,032,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11397/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=2,188,224,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11398/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=2,188,416,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11399/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=2,188,608,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11400/500000] + optim/total_grad_norm=9.281 + train/ActionL1Loss=0.0401 + throughput/total_tokens=2,188,800,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11401/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,188,992,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11402/500000] + train/ActionL1Loss=0.0570 + throughput/total_tokens=2,189,184,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11403/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=2,189,376,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11404/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=2,189,568,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11405/500000] + train/ActionL1Loss=0.0319 + throughput/total_tokens=2,189,760,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11406/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=2,189,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11407/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,190,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11408/500000] + train/ActionL1Loss=0.0485 + throughput/total_tokens=2,190,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11409/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=2,190,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11410/500000] + train/ActionL1Loss=0.0565 + throughput/total_tokens=2,190,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11411/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,190,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11412/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,191,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11413/500000] + train/ActionL1Loss=0.0263 + throughput/total_tokens=2,191,296,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11414/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,191,488,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11415/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,191,680,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11416/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,191,872,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11417/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,192,064,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11418/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,192,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11419/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,192,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11420/500000] + optim/total_grad_norm=8.181 + train/ActionL1Loss=0.0455 + throughput/total_tokens=2,192,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11421/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=2,192,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11422/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=2,193,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11423/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,193,216,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11424/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,193,408,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11425/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=2,193,600,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11426/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=2,193,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11427/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=2,193,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11428/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=2,194,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11429/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=2,194,368,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11430/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,194,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11431/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=2,194,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11432/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=2,194,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11433/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=2,195,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11434/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=2,195,328,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11435/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=2,195,520,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11436/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,195,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11437/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,195,904,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11438/500000] + train/ActionL1Loss=0.0426 + throughput/total_tokens=2,196,096,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11439/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=2,196,288,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11440/500000] + optim/total_grad_norm=8.003 + train/ActionL1Loss=0.0478 + throughput/total_tokens=2,196,480,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11441/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,196,672,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11442/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=2,196,864,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11443/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,197,056,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11444/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,197,248,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11445/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=2,197,440,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11446/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=2,197,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11447/500000] + train/ActionL1Loss=0.0541 + throughput/total_tokens=2,197,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11448/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,198,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11449/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=2,198,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11450/500000] + train/ActionL1Loss=0.0495 + throughput/total_tokens=2,198,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11451/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=2,198,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11452/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=2,198,784,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11453/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=2,198,976,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11454/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=2,199,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11455/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,199,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11456/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=2,199,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11457/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=2,199,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11458/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=2,199,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11459/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=2,200,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11460/500000] + optim/total_grad_norm=9.578 + train/ActionL1Loss=0.0319 + throughput/total_tokens=2,200,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11461/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,200,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11462/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,200,704,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11463/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=2,200,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11464/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,201,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11465/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=2,201,280,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11466/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,201,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11467/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=2,201,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11468/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=2,201,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11469/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,202,048,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11470/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=2,202,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11471/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=2,202,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11472/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,202,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11473/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,202,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11474/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=2,203,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11475/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=2,203,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11476/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=2,203,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11477/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=2,203,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11478/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=2,203,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11479/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,203,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11480/500000] + optim/total_grad_norm=7.866 + train/ActionL1Loss=0.0387 + throughput/total_tokens=2,204,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11481/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=2,204,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11482/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=2,204,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11483/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=2,204,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11484/500000] + train/ActionL1Loss=0.0278 + throughput/total_tokens=2,204,928,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11485/500000] + train/ActionL1Loss=0.0290 + throughput/total_tokens=2,205,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11486/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=2,205,312,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11487/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,205,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11488/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=2,205,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11489/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=2,205,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11490/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=2,206,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11491/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=2,206,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11492/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=2,206,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11493/500000] + train/ActionL1Loss=0.0497 + throughput/total_tokens=2,206,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11494/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=2,206,848,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11495/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=2,207,040,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11496/500000] + train/ActionL1Loss=0.0658 + throughput/total_tokens=2,207,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11497/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,207,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11498/500000] + train/ActionL1Loss=0.0604 + throughput/total_tokens=2,207,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11499/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,207,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11500/500000] + optim/total_grad_norm=8.182 + train/ActionL1Loss=0.0610 + throughput/total_tokens=2,208,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +10/14 [11:33:28] INFO | >> Saving config... checkpoint.py:608 +10/14 [11:34:11] INFO | >> Saving model state... checkpoint.py:796 +10/14 [11:35:23] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [11:36:55] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=11501/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=2,208,192,000 + throughput/device/tokens_per_second=1,207 + throughput/device/batches_per_second=0.0503 +[step=11502/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,208,384,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11503/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=2,208,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11504/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=2,208,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11505/500000] + train/ActionL1Loss=0.0513 + throughput/total_tokens=2,208,960,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11506/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,209,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11507/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,209,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11508/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=2,209,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11509/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=2,209,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11510/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,209,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11511/500000] + train/ActionL1Loss=0.0310 + throughput/total_tokens=2,210,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11512/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=2,210,304,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11513/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=2,210,496,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11514/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=2,210,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11515/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,210,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11516/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=2,211,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11517/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=2,211,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11518/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=2,211,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11519/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=2,211,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11520/500000] + optim/total_grad_norm=9.287 + train/ActionL1Loss=0.0275 + throughput/total_tokens=2,211,840,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11521/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=2,212,032,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11522/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=2,212,224,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11523/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,212,416,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11524/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=2,212,608,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11525/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=2,212,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11526/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=2,212,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11527/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=2,213,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11528/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,213,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11529/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,213,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11530/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,213,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11531/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,213,952,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11532/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,214,144,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11533/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=2,214,336,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11534/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=2,214,528,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11535/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=2,214,720,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11536/500000] + train/ActionL1Loss=0.0300 + throughput/total_tokens=2,214,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11537/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,215,104,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11538/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,215,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11539/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,215,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11540/500000] + optim/total_grad_norm=8.681 + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,215,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11541/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=2,215,872,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11542/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=2,216,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11543/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=2,216,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11544/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=2,216,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11545/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=2,216,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11546/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=2,216,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11547/500000] + train/ActionL1Loss=0.0554 + throughput/total_tokens=2,217,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11548/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=2,217,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11549/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=2,217,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11550/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=2,217,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11551/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=2,217,792,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11552/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,217,984,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11553/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,218,176,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11554/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=2,218,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11555/500000] + train/ActionL1Loss=0.0345 + throughput/total_tokens=2,218,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11556/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=2,218,752,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11557/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=2,218,944,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11558/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,219,136,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11559/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=2,219,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11560/500000] + optim/total_grad_norm=8.331 + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,219,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11561/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=2,219,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11562/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=2,219,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11563/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,220,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11564/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=2,220,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11565/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=2,220,480,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11566/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=2,220,672,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11567/500000] + train/ActionL1Loss=0.0607 + throughput/total_tokens=2,220,864,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11568/500000] + train/ActionL1Loss=0.0587 + throughput/total_tokens=2,221,056,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11569/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=2,221,248,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11570/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=2,221,440,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11571/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,221,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11572/500000] + train/ActionL1Loss=0.0249 + throughput/total_tokens=2,221,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11573/500000] + train/ActionL1Loss=0.0342 + throughput/total_tokens=2,222,016,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11574/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,222,208,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11575/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,222,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11576/500000] + train/ActionL1Loss=0.0286 + throughput/total_tokens=2,222,592,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11577/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=2,222,784,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11578/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=2,222,976,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11579/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=2,223,168,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11580/500000] + optim/total_grad_norm=8.204 + train/ActionL1Loss=0.0324 + throughput/total_tokens=2,223,360,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11581/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=2,223,552,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11582/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,223,744,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11583/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=2,223,936,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11584/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=2,224,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11585/500000] + train/ActionL1Loss=0.0318 + throughput/total_tokens=2,224,320,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11586/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=2,224,512,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11587/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=2,224,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11588/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=2,224,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11589/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,225,088,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11590/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,225,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11591/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=2,225,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11592/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=2,225,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11593/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=2,225,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11594/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=2,226,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11595/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,226,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11596/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=2,226,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11597/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=2,226,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11598/500000] + train/ActionL1Loss=0.0401 + throughput/total_tokens=2,226,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11599/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=2,227,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11600/500000] + optim/total_grad_norm=9.681 + train/ActionL1Loss=0.0498 + throughput/total_tokens=2,227,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11601/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,227,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11602/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=2,227,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11603/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,227,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11604/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=2,227,968,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11605/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=2,228,160,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11606/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=2,228,352,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11607/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=2,228,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11608/500000] + train/ActionL1Loss=0.0580 + throughput/total_tokens=2,228,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11609/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=2,228,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11610/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=2,229,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11611/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=2,229,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11612/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,229,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11613/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,229,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11614/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=2,229,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11615/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=2,230,080,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11616/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,230,272,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11617/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=2,230,464,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11618/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=2,230,656,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11619/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=2,230,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11620/500000] + optim/total_grad_norm=8.394 + train/ActionL1Loss=0.0323 + throughput/total_tokens=2,231,040,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11621/500000] + train/ActionL1Loss=0.0332 + throughput/total_tokens=2,231,232,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11622/500000] + train/ActionL1Loss=0.0148 + throughput/total_tokens=2,231,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11623/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,231,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11624/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=2,231,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11625/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,232,000,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11626/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=2,232,192,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11627/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=2,232,384,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11628/500000] + train/ActionL1Loss=0.0354 + throughput/total_tokens=2,232,576,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11629/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=2,232,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11630/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=2,232,960,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11631/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=2,233,152,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11632/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=2,233,344,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11633/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=2,233,536,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11634/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=2,233,728,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11635/500000] + train/ActionL1Loss=0.0313 + throughput/total_tokens=2,233,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11636/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=2,234,112,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11637/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=2,234,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11638/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=2,234,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11639/500000] + train/ActionL1Loss=0.0649 + throughput/total_tokens=2,234,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11640/500000] + optim/total_grad_norm=6.614 + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,234,880,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11641/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=2,235,072,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11642/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,235,264,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11643/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,235,456,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11644/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=2,235,648,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11645/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=2,235,840,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11646/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,236,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11647/500000] + train/ActionL1Loss=0.0295 + throughput/total_tokens=2,236,224,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11648/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=2,236,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11649/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=2,236,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11650/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,236,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11651/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=2,236,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11652/500000] + train/ActionL1Loss=0.0532 + throughput/total_tokens=2,237,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11653/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,237,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11654/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=2,237,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11655/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=2,237,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11656/500000] + train/ActionL1Loss=0.0550 + throughput/total_tokens=2,237,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11657/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=2,238,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11658/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=2,238,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11659/500000] + train/ActionL1Loss=0.0358 + throughput/total_tokens=2,238,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11660/500000] + optim/total_grad_norm=7.707 + train/ActionL1Loss=0.0573 + throughput/total_tokens=2,238,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11661/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=2,238,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11662/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=2,239,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11663/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=2,239,296,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11664/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,239,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11665/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,239,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11666/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=2,239,872,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11667/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=2,240,064,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11668/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=2,240,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11669/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,240,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11670/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=2,240,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11671/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=2,240,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11672/500000] + train/ActionL1Loss=0.0344 + throughput/total_tokens=2,241,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11673/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=2,241,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11674/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=2,241,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11675/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,241,600,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11676/500000] + train/ActionL1Loss=0.0250 + throughput/total_tokens=2,241,792,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11677/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=2,241,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11678/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=2,242,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11679/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,242,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11680/500000] + optim/total_grad_norm=6.544 + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,242,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11681/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=2,242,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11682/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,242,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11683/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=2,243,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11684/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=2,243,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11685/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=2,243,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11686/500000] + train/ActionL1Loss=0.0278 + throughput/total_tokens=2,243,712,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11687/500000] + train/ActionL1Loss=0.0477 + throughput/total_tokens=2,243,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11688/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=2,244,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11689/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=2,244,288,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11690/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=2,244,480,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11691/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=2,244,672,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11692/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=2,244,864,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11693/500000] + train/ActionL1Loss=0.0283 + throughput/total_tokens=2,245,056,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11694/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,245,248,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11695/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=2,245,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11696/500000] + train/ActionL1Loss=0.0289 + throughput/total_tokens=2,245,632,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11697/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=2,245,824,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11698/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=2,246,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11699/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,246,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11700/500000] + optim/total_grad_norm=7.640 + train/ActionL1Loss=0.0577 + throughput/total_tokens=2,246,400,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11701/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=2,246,592,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11702/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=2,246,784,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11703/500000] + train/ActionL1Loss=0.0228 + throughput/total_tokens=2,246,976,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11704/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=2,247,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11705/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=2,247,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11706/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,247,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11707/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=2,247,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11708/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=2,247,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11709/500000] + train/ActionL1Loss=0.0366 + throughput/total_tokens=2,248,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11710/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,248,320,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11711/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,248,512,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11712/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=2,248,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11713/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=2,248,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11714/500000] + train/ActionL1Loss=0.0567 + throughput/total_tokens=2,249,088,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11715/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=2,249,280,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11716/500000] + train/ActionL1Loss=0.0268 + throughput/total_tokens=2,249,472,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11717/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=2,249,664,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11718/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=2,249,856,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11719/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,250,048,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11720/500000] + optim/total_grad_norm=8.067 + train/ActionL1Loss=0.0522 + throughput/total_tokens=2,250,240,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11721/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=2,250,432,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11722/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=2,250,624,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11723/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=2,250,816,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11724/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=2,251,008,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11725/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=2,251,200,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11726/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,251,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11727/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,251,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11728/500000] + train/ActionL1Loss=0.0288 + throughput/total_tokens=2,251,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11729/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=2,251,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11730/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=2,252,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11731/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=2,252,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11732/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=2,252,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11733/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=2,252,736,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11734/500000] + train/ActionL1Loss=0.0632 + throughput/total_tokens=2,252,928,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11735/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=2,253,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11736/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=2,253,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11737/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=2,253,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11738/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=2,253,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11739/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=2,253,888,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11740/500000] + optim/total_grad_norm=7.682 + train/ActionL1Loss=0.0282 + throughput/total_tokens=2,254,080,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11741/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=2,254,272,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11742/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,254,464,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11743/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=2,254,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11744/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=2,254,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11745/500000] + train/ActionL1Loss=0.0332 + throughput/total_tokens=2,255,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11746/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=2,255,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11747/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=2,255,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11748/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,255,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11749/500000] + train/ActionL1Loss=0.0553 + throughput/total_tokens=2,255,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11750/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,256,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11751/500000] + train/ActionL1Loss=0.0272 + throughput/total_tokens=2,256,192,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11752/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=2,256,384,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11753/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=2,256,576,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11754/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,256,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11755/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,256,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11756/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=2,257,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11757/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=2,257,344,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11758/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=2,257,536,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11759/500000] + train/ActionL1Loss=0.0287 + throughput/total_tokens=2,257,728,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11760/500000] + optim/total_grad_norm=7.789 + train/ActionL1Loss=0.0395 + throughput/total_tokens=2,257,920,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11761/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=2,258,112,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11762/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=2,258,304,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11763/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=2,258,496,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11764/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=2,258,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11765/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=2,258,880,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11766/500000] + train/ActionL1Loss=0.0311 + throughput/total_tokens=2,259,072,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11767/500000] + train/ActionL1Loss=0.0250 + throughput/total_tokens=2,259,264,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11768/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=2,259,456,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11769/500000] + train/ActionL1Loss=0.0182 + throughput/total_tokens=2,259,648,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=11770/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,259,840,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11771/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=2,260,032,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11772/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,260,224,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11773/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=2,260,416,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11774/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=2,260,608,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11775/500000] + train/ActionL1Loss=0.0292 + throughput/total_tokens=2,260,800,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11776/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=2,260,992,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11777/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=2,261,184,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11778/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=2,261,376,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11779/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=2,261,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11780/500000] + optim/total_grad_norm=8.535 + train/ActionL1Loss=0.0344 + throughput/total_tokens=2,261,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11781/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=2,261,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11782/500000] + train/ActionL1Loss=0.0592 + throughput/total_tokens=2,262,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11783/500000] + train/ActionL1Loss=0.0291 + throughput/total_tokens=2,262,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11784/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=2,262,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11785/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,262,720,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11786/500000] + train/ActionL1Loss=0.0480 + throughput/total_tokens=2,262,912,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11787/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=2,263,104,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11788/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,263,296,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11789/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=2,263,488,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11790/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=2,263,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11791/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=2,263,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11792/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=2,264,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11793/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=2,264,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11794/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,264,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11795/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,264,640,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11796/500000] + train/ActionL1Loss=0.0491 + throughput/total_tokens=2,264,832,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11797/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=2,265,024,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11798/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=2,265,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11799/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,265,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11800/500000] + optim/total_grad_norm=7.082 + train/ActionL1Loss=0.0370 + throughput/total_tokens=2,265,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11801/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,265,792,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11802/500000] + train/ActionL1Loss=0.0404 + throughput/total_tokens=2,265,984,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11803/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,266,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11804/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=2,266,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11805/500000] + train/ActionL1Loss=0.0411 + throughput/total_tokens=2,266,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11806/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=2,266,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11807/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=2,266,944,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11808/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,267,136,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11809/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=2,267,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11810/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=2,267,520,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11811/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=2,267,712,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11812/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,267,904,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11813/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=2,268,096,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11814/500000] + train/ActionL1Loss=0.0525 + throughput/total_tokens=2,268,288,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11815/500000] + train/ActionL1Loss=0.0300 + throughput/total_tokens=2,268,480,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11816/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=2,268,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11817/500000] + train/ActionL1Loss=0.0576 + throughput/total_tokens=2,268,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11818/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=2,269,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11819/500000] + train/ActionL1Loss=0.0280 + throughput/total_tokens=2,269,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11820/500000] + optim/total_grad_norm=8.062 + train/ActionL1Loss=0.0431 + throughput/total_tokens=2,269,440,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11821/500000] + train/ActionL1Loss=0.0446 + throughput/total_tokens=2,269,632,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11822/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=2,269,824,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11823/500000] + train/ActionL1Loss=0.0505 + throughput/total_tokens=2,270,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11824/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=2,270,208,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11825/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,270,400,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11826/500000] + train/ActionL1Loss=0.0421 + throughput/total_tokens=2,270,592,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11827/500000] + train/ActionL1Loss=0.0494 + throughput/total_tokens=2,270,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11828/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=2,270,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11829/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=2,271,168,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11830/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,271,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11831/500000] + train/ActionL1Loss=0.0276 + throughput/total_tokens=2,271,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11832/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,271,744,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11833/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=2,271,936,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11834/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=2,272,128,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11835/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=2,272,320,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11836/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,272,512,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11837/500000] + train/ActionL1Loss=0.0540 + throughput/total_tokens=2,272,704,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11838/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=2,272,896,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11839/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,273,088,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11840/500000] + optim/total_grad_norm=7.707 + train/ActionL1Loss=0.0544 + throughput/total_tokens=2,273,280,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11841/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,273,472,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11842/500000] + train/ActionL1Loss=0.0250 + throughput/total_tokens=2,273,664,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11843/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=2,273,856,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11844/500000] + train/ActionL1Loss=0.0353 + throughput/total_tokens=2,274,048,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11845/500000] + train/ActionL1Loss=0.0450 + throughput/total_tokens=2,274,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11846/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=2,274,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11847/500000] + train/ActionL1Loss=0.0412 + throughput/total_tokens=2,274,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11848/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=2,274,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11849/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,275,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11850/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=2,275,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11851/500000] + train/ActionL1Loss=0.0313 + throughput/total_tokens=2,275,392,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11852/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,275,584,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11853/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=2,275,776,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11854/500000] + train/ActionL1Loss=0.0245 + throughput/total_tokens=2,275,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11855/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,276,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11856/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,276,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11857/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,276,544,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11858/500000] + train/ActionL1Loss=0.0284 + throughput/total_tokens=2,276,736,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11859/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=2,276,928,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11860/500000] + optim/total_grad_norm=8.576 + train/ActionL1Loss=0.0376 + throughput/total_tokens=2,277,120,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=11861/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=2,277,312,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=11862/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=2,277,504,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11863/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=2,277,696,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11864/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=2,277,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11865/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=2,278,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11866/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,278,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11867/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,278,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11868/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,278,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11869/500000] + train/ActionL1Loss=0.0324 + throughput/total_tokens=2,278,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11870/500000] + train/ActionL1Loss=0.0574 + throughput/total_tokens=2,279,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11871/500000] + train/ActionL1Loss=0.0333 + throughput/total_tokens=2,279,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11872/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=2,279,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11873/500000] + train/ActionL1Loss=0.0385 + throughput/total_tokens=2,279,616,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11874/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=2,279,808,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11875/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=2,280,000,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11876/500000] + train/ActionL1Loss=0.0347 + throughput/total_tokens=2,280,192,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11877/500000] + train/ActionL1Loss=0.0476 + throughput/total_tokens=2,280,384,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11878/500000] + train/ActionL1Loss=0.0542 + throughput/total_tokens=2,280,576,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11879/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=2,280,768,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11880/500000] + optim/total_grad_norm=8.369 + train/ActionL1Loss=0.0536 + throughput/total_tokens=2,280,960,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11881/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,281,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11882/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,281,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11883/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,281,536,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11884/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=2,281,728,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11885/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=2,281,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11886/500000] + train/ActionL1Loss=0.0328 + throughput/total_tokens=2,282,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11887/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,282,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11888/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=2,282,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11889/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=2,282,688,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11890/500000] + train/ActionL1Loss=0.0546 + throughput/total_tokens=2,282,880,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11891/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=2,283,072,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11892/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=2,283,264,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11893/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=2,283,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11894/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=2,283,648,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11895/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=2,283,840,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11896/500000] + train/ActionL1Loss=0.0141 + throughput/total_tokens=2,284,032,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11897/500000] + train/ActionL1Loss=0.0654 + throughput/total_tokens=2,284,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11898/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,284,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11899/500000] + train/ActionL1Loss=0.0346 + throughput/total_tokens=2,284,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11900/500000] + optim/total_grad_norm=9.461 + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,284,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11901/500000] + train/ActionL1Loss=0.0481 + throughput/total_tokens=2,284,992,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11902/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,285,184,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11903/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,285,376,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11904/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=2,285,568,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11905/500000] + train/ActionL1Loss=0.0234 + throughput/total_tokens=2,285,760,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11906/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=2,285,952,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11907/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=2,286,144,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11908/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,286,336,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11909/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=2,286,528,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11910/500000] + train/ActionL1Loss=0.0501 + throughput/total_tokens=2,286,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11911/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=2,286,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11912/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=2,287,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11913/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=2,287,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11914/500000] + train/ActionL1Loss=0.0487 + throughput/total_tokens=2,287,488,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11915/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=2,287,680,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11916/500000] + train/ActionL1Loss=0.0321 + throughput/total_tokens=2,287,872,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11917/500000] + train/ActionL1Loss=0.0313 + throughput/total_tokens=2,288,064,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=11918/500000] + train/ActionL1Loss=0.0452 + throughput/total_tokens=2,288,256,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11919/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,288,448,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11920/500000] + optim/total_grad_norm=8.746 + train/ActionL1Loss=0.0351 + throughput/total_tokens=2,288,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11921/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=2,288,832,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11922/500000] + train/ActionL1Loss=0.0294 + throughput/total_tokens=2,289,024,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11923/500000] + train/ActionL1Loss=0.0547 + throughput/total_tokens=2,289,216,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11924/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=2,289,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11925/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,289,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11926/500000] + train/ActionL1Loss=0.0464 + throughput/total_tokens=2,289,792,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11927/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,289,984,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11928/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=2,290,176,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11929/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=2,290,368,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11930/500000] + train/ActionL1Loss=0.0286 + throughput/total_tokens=2,290,560,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11931/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=2,290,752,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11932/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=2,290,944,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11933/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=2,291,136,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11934/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=2,291,328,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11935/500000] + train/ActionL1Loss=0.0271 + throughput/total_tokens=2,291,520,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11936/500000] + train/ActionL1Loss=0.0528 + throughput/total_tokens=2,291,712,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11937/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=2,291,904,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11938/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,292,096,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11939/500000] + train/ActionL1Loss=0.0646 + throughput/total_tokens=2,292,288,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11940/500000] + optim/total_grad_norm=7.057 + train/ActionL1Loss=0.0509 + throughput/total_tokens=2,292,480,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11941/500000] + train/ActionL1Loss=0.0617 + throughput/total_tokens=2,292,672,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11942/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=2,292,864,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=11943/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,293,056,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11944/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=2,293,248,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11945/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=2,293,440,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11946/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,293,632,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11947/500000] + train/ActionL1Loss=0.0509 + throughput/total_tokens=2,293,824,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11948/500000] + train/ActionL1Loss=0.0352 + throughput/total_tokens=2,294,016,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=11949/500000] + train/ActionL1Loss=0.0504 + throughput/total_tokens=2,294,208,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=11950/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=2,294,400,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=11951/500000] + train/ActionL1Loss=0.0340 + throughput/total_tokens=2,294,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11952/500000] + train/ActionL1Loss=0.0283 + throughput/total_tokens=2,294,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11953/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=2,294,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11954/500000] + train/ActionL1Loss=0.0225 + throughput/total_tokens=2,295,168,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11955/500000] + train/ActionL1Loss=0.0534 + throughput/total_tokens=2,295,360,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11956/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,295,552,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11957/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,295,744,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11958/500000] + train/ActionL1Loss=0.0298 + throughput/total_tokens=2,295,936,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11959/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=2,296,128,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11960/500000] + optim/total_grad_norm=8.231 + train/ActionL1Loss=0.0455 + throughput/total_tokens=2,296,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=11961/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=2,296,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11962/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=2,296,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11963/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,296,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11964/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=2,297,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11965/500000] + train/ActionL1Loss=0.0382 + throughput/total_tokens=2,297,280,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11966/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=2,297,472,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11967/500000] + train/ActionL1Loss=0.0327 + throughput/total_tokens=2,297,664,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11968/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=2,297,856,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=11969/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=2,298,048,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=11970/500000] + train/ActionL1Loss=0.0465 + throughput/total_tokens=2,298,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11971/500000] + train/ActionL1Loss=0.0373 + throughput/total_tokens=2,298,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11972/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,298,624,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11973/500000] + train/ActionL1Loss=0.0558 + throughput/total_tokens=2,298,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11974/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=2,299,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11975/500000] + train/ActionL1Loss=0.0585 + throughput/total_tokens=2,299,200,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11976/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,299,392,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11977/500000] + train/ActionL1Loss=0.0235 + throughput/total_tokens=2,299,584,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11978/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=2,299,776,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11979/500000] + train/ActionL1Loss=0.0545 + throughput/total_tokens=2,299,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11980/500000] + optim/total_grad_norm=7.492 + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,300,160,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11981/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=2,300,352,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11982/500000] + train/ActionL1Loss=0.0425 + throughput/total_tokens=2,300,544,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11983/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,300,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=11984/500000] + train/ActionL1Loss=0.0506 + throughput/total_tokens=2,300,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11985/500000] + train/ActionL1Loss=0.0531 + throughput/total_tokens=2,301,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11986/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,301,312,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11987/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,301,504,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11988/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=2,301,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11989/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=2,301,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11990/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=2,302,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=11991/500000] + train/ActionL1Loss=0.0503 + throughput/total_tokens=2,302,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11992/500000] + train/ActionL1Loss=0.0234 + throughput/total_tokens=2,302,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=11993/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,302,656,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11994/500000] + train/ActionL1Loss=0.0448 + throughput/total_tokens=2,302,848,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11995/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=2,303,040,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11996/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,303,232,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11997/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=2,303,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=11998/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=2,303,616,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=11999/500000] + train/ActionL1Loss=0.0572 + throughput/total_tokens=2,303,808,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12000/500000] + optim/total_grad_norm=9.680 + train/ActionL1Loss=0.0540 + throughput/total_tokens=2,304,000,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +10/14 [14:28:03] INFO | >> Saving config... checkpoint.py:608 +10/14 [14:28:50] INFO | >> Saving model state... checkpoint.py:796 +10/14 [14:30:01] INFO | >> Saving optim state... checkpoint.py:811 +10/14 [14:31:31] INFO | >> Saving trainer state... checkpoint.py:670 + INFO | >> Saving config... checkpoint.py:608 +[step=12001/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=2,304,192,000 + throughput/device/tokens_per_second=1,207 + throughput/device/batches_per_second=0.0503 +[step=12002/500000] + train/ActionL1Loss=0.0502 + throughput/total_tokens=2,304,384,000 + throughput/device/tokens_per_second=1,182 + throughput/device/batches_per_second=0.0493 +[step=12003/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=2,304,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12004/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,304,768,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12005/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,304,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12006/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=2,305,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12007/500000] + train/ActionL1Loss=0.0443 + throughput/total_tokens=2,305,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12008/500000] + train/ActionL1Loss=0.0357 + throughput/total_tokens=2,305,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12009/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=2,305,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12010/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=2,305,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12011/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=2,306,112,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12012/500000] + train/ActionL1Loss=0.0392 + throughput/total_tokens=2,306,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12013/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=2,306,496,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12014/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,306,688,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12015/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=2,306,880,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12016/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=2,307,072,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12017/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,307,264,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12018/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=2,307,456,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12019/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,307,648,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12020/500000] + optim/total_grad_norm=8.085 + train/ActionL1Loss=0.0541 + throughput/total_tokens=2,307,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12021/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,308,032,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12022/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,308,224,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12023/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,308,416,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12024/500000] + train/ActionL1Loss=0.0365 + throughput/total_tokens=2,308,608,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12025/500000] + train/ActionL1Loss=0.0331 + throughput/total_tokens=2,308,800,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12026/500000] + train/ActionL1Loss=0.0376 + throughput/total_tokens=2,308,992,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12027/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=2,309,184,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12028/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=2,309,376,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12029/500000] + train/ActionL1Loss=0.0319 + throughput/total_tokens=2,309,568,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12030/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=2,309,760,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12031/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=2,309,952,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12032/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=2,310,144,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12033/500000] + train/ActionL1Loss=0.0493 + throughput/total_tokens=2,310,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12034/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=2,310,528,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12035/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=2,310,720,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12036/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=2,310,912,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12037/500000] + train/ActionL1Loss=0.0555 + throughput/total_tokens=2,311,104,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12038/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=2,311,296,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12039/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=2,311,488,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12040/500000] + optim/total_grad_norm=9.444 + train/ActionL1Loss=0.0493 + throughput/total_tokens=2,311,680,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=12041/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,311,872,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12042/500000] + train/ActionL1Loss=0.0468 + throughput/total_tokens=2,312,064,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12043/500000] + train/ActionL1Loss=0.0407 + throughput/total_tokens=2,312,256,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12044/500000] + train/ActionL1Loss=0.0438 + throughput/total_tokens=2,312,448,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=12045/500000] + train/ActionL1Loss=0.0269 + throughput/total_tokens=2,312,640,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12046/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,312,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12047/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=2,313,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12048/500000] + train/ActionL1Loss=0.0511 + throughput/total_tokens=2,313,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12049/500000] + train/ActionL1Loss=0.0538 + throughput/total_tokens=2,313,408,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=12050/500000] + train/ActionL1Loss=0.0472 + throughput/total_tokens=2,313,600,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=12051/500000] + train/ActionL1Loss=0.0255 + throughput/total_tokens=2,313,792,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12052/500000] + train/ActionL1Loss=0.0323 + throughput/total_tokens=2,313,984,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12053/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=2,314,176,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12054/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,314,368,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12055/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=2,314,560,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12056/500000] + train/ActionL1Loss=0.0429 + throughput/total_tokens=2,314,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12057/500000] + train/ActionL1Loss=0.0222 + throughput/total_tokens=2,314,944,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12058/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=2,315,136,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12059/500000] + train/ActionL1Loss=0.0527 + throughput/total_tokens=2,315,328,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12060/500000] + optim/total_grad_norm=7.900 + train/ActionL1Loss=0.0429 + throughput/total_tokens=2,315,520,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 + System/Peak GPU Memory (MB)=46,924 +[step=12061/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,315,712,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12062/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=2,315,904,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=12063/500000] + train/ActionL1Loss=0.0374 + throughput/total_tokens=2,316,096,000 + throughput/device/tokens_per_second=1,172 + throughput/device/batches_per_second=0.0489 +[step=12064/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=2,316,288,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12065/500000] + train/ActionL1Loss=0.0343 + throughput/total_tokens=2,316,480,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12066/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=2,316,672,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12067/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=2,316,864,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12068/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,317,056,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12069/500000] + train/ActionL1Loss=0.0372 + throughput/total_tokens=2,317,248,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12070/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=2,317,440,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12071/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=2,317,632,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12072/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=2,317,824,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12073/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,318,016,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12074/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,318,208,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12075/500000] + train/ActionL1Loss=0.0215 + throughput/total_tokens=2,318,400,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12076/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=2,318,592,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12077/500000] + train/ActionL1Loss=0.0442 + throughput/total_tokens=2,318,784,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12078/500000] + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,318,976,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12079/500000] + train/ActionL1Loss=0.0391 + throughput/total_tokens=2,319,168,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12080/500000] + optim/total_grad_norm=6.728 + train/ActionL1Loss=0.0317 + throughput/total_tokens=2,319,360,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12081/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=2,319,552,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12082/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=2,319,744,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12083/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=2,319,936,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12084/500000] + train/ActionL1Loss=0.0383 + throughput/total_tokens=2,320,128,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12085/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=2,320,320,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12086/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=2,320,512,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12087/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=2,320,704,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12088/500000] + train/ActionL1Loss=0.0612 + throughput/total_tokens=2,320,896,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12089/500000] + train/ActionL1Loss=0.0471 + throughput/total_tokens=2,321,088,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=12090/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=2,321,280,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=12091/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=2,321,472,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=12092/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,321,664,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=12093/500000] + train/ActionL1Loss=0.0356 + throughput/total_tokens=2,321,856,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12094/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,322,048,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 +[step=12095/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=2,322,240,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12096/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,322,432,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12097/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,322,624,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12098/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=2,322,816,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12099/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,323,008,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12100/500000] + optim/total_grad_norm=9.061 + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,323,200,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=12101/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=2,323,392,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12102/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,323,584,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12103/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,323,776,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12104/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=2,323,968,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12105/500000] + train/ActionL1Loss=0.0447 + throughput/total_tokens=2,324,160,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12106/500000] + train/ActionL1Loss=0.0271 + throughput/total_tokens=2,324,352,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12107/500000] + train/ActionL1Loss=0.0479 + throughput/total_tokens=2,324,544,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12108/500000] + train/ActionL1Loss=0.0325 + throughput/total_tokens=2,324,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12109/500000] + train/ActionL1Loss=0.0519 + throughput/total_tokens=2,324,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12110/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,325,120,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12111/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=2,325,312,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12112/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,325,504,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12113/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,325,696,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12114/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,325,888,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12115/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=2,326,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12116/500000] + train/ActionL1Loss=0.0539 + throughput/total_tokens=2,326,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12117/500000] + train/ActionL1Loss=0.0460 + throughput/total_tokens=2,326,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12118/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,326,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12119/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=2,326,848,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12120/500000] + optim/total_grad_norm=9.269 + train/ActionL1Loss=0.0492 + throughput/total_tokens=2,327,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12121/500000] + train/ActionL1Loss=0.0474 + throughput/total_tokens=2,327,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12122/500000] + train/ActionL1Loss=0.0386 + throughput/total_tokens=2,327,424,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12123/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=2,327,616,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12124/500000] + train/ActionL1Loss=0.0379 + throughput/total_tokens=2,327,808,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=12125/500000] + train/ActionL1Loss=0.0451 + throughput/total_tokens=2,328,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12126/500000] + train/ActionL1Loss=0.0478 + throughput/total_tokens=2,328,192,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12127/500000] + train/ActionL1Loss=0.0285 + throughput/total_tokens=2,328,384,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=12128/500000] + train/ActionL1Loss=0.0455 + throughput/total_tokens=2,328,576,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12129/500000] + train/ActionL1Loss=0.0237 + throughput/total_tokens=2,328,768,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12130/500000] + train/ActionL1Loss=0.0578 + throughput/total_tokens=2,328,960,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12131/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,329,152,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12132/500000] + train/ActionL1Loss=0.0364 + throughput/total_tokens=2,329,344,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12133/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,329,536,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12134/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,329,728,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12135/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=2,329,920,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12136/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=2,330,112,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12137/500000] + train/ActionL1Loss=0.0423 + throughput/total_tokens=2,330,304,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12138/500000] + train/ActionL1Loss=0.0470 + throughput/total_tokens=2,330,496,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12139/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,330,688,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12140/500000] + optim/total_grad_norm=8.609 + train/ActionL1Loss=0.0485 + throughput/total_tokens=2,330,880,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12141/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=2,331,072,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12142/500000] + train/ActionL1Loss=0.0286 + throughput/total_tokens=2,331,264,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12143/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,331,456,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12144/500000] + train/ActionL1Loss=0.0405 + throughput/total_tokens=2,331,648,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12145/500000] + train/ActionL1Loss=0.0473 + throughput/total_tokens=2,331,840,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12146/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=2,332,032,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12147/500000] + train/ActionL1Loss=0.0367 + throughput/total_tokens=2,332,224,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12148/500000] + train/ActionL1Loss=0.0560 + throughput/total_tokens=2,332,416,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12149/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,332,608,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12150/500000] + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,332,800,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12151/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=2,332,992,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12152/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=2,333,184,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12153/500000] + train/ActionL1Loss=0.0575 + throughput/total_tokens=2,333,376,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12154/500000] + train/ActionL1Loss=0.0462 + throughput/total_tokens=2,333,568,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=12155/500000] + train/ActionL1Loss=0.0445 + throughput/total_tokens=2,333,760,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=12156/500000] + train/ActionL1Loss=0.0559 + throughput/total_tokens=2,333,952,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12157/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,334,144,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12158/500000] + train/ActionL1Loss=0.0219 + throughput/total_tokens=2,334,336,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=12159/500000] + train/ActionL1Loss=0.0402 + throughput/total_tokens=2,334,528,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12160/500000] + optim/total_grad_norm=10.18 + train/ActionL1Loss=0.0291 + throughput/total_tokens=2,334,720,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12161/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=2,334,912,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12162/500000] + train/ActionL1Loss=0.0360 + throughput/total_tokens=2,335,104,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12163/500000] + train/ActionL1Loss=0.0334 + throughput/total_tokens=2,335,296,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12164/500000] + train/ActionL1Loss=0.0419 + throughput/total_tokens=2,335,488,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12165/500000] + train/ActionL1Loss=0.0384 + throughput/total_tokens=2,335,680,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12166/500000] + train/ActionL1Loss=0.0482 + throughput/total_tokens=2,335,872,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12167/500000] + train/ActionL1Loss=0.0381 + throughput/total_tokens=2,336,064,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12168/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,336,256,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12169/500000] + train/ActionL1Loss=0.0291 + throughput/total_tokens=2,336,448,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12170/500000] + train/ActionL1Loss=0.0437 + throughput/total_tokens=2,336,640,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12171/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=2,336,832,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12172/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,337,024,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12173/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=2,337,216,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12174/500000] + train/ActionL1Loss=0.0449 + throughput/total_tokens=2,337,408,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12175/500000] + train/ActionL1Loss=0.0522 + throughput/total_tokens=2,337,600,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12176/500000] + train/ActionL1Loss=0.0603 + throughput/total_tokens=2,337,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12177/500000] + train/ActionL1Loss=0.0302 + throughput/total_tokens=2,337,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12178/500000] + train/ActionL1Loss=0.0380 + throughput/total_tokens=2,338,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12179/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=2,338,368,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12180/500000] + optim/total_grad_norm=9.770 + train/ActionL1Loss=0.0282 + throughput/total_tokens=2,338,560,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12181/500000] + train/ActionL1Loss=0.0317 + throughput/total_tokens=2,338,752,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12182/500000] + train/ActionL1Loss=0.0273 + throughput/total_tokens=2,338,944,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12183/500000] + train/ActionL1Loss=0.0427 + throughput/total_tokens=2,339,136,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12184/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=2,339,328,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12185/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=2,339,520,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12186/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=2,339,712,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12187/500000] + train/ActionL1Loss=0.0409 + throughput/total_tokens=2,339,904,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12188/500000] + train/ActionL1Loss=0.0349 + throughput/total_tokens=2,340,096,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12189/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=2,340,288,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12190/500000] + train/ActionL1Loss=0.0338 + throughput/total_tokens=2,340,480,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12191/500000] + train/ActionL1Loss=0.0308 + throughput/total_tokens=2,340,672,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12192/500000] + train/ActionL1Loss=0.0327 + throughput/total_tokens=2,340,864,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12193/500000] + train/ActionL1Loss=0.0433 + throughput/total_tokens=2,341,056,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12194/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,341,248,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12195/500000] + train/ActionL1Loss=0.0332 + throughput/total_tokens=2,341,440,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12196/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,341,632,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12197/500000] + train/ActionL1Loss=0.0300 + throughput/total_tokens=2,341,824,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12198/500000] + train/ActionL1Loss=0.0544 + throughput/total_tokens=2,342,016,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12199/500000] + train/ActionL1Loss=0.0336 + throughput/total_tokens=2,342,208,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12200/500000] + optim/total_grad_norm=8.993 + train/ActionL1Loss=0.0469 + throughput/total_tokens=2,342,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12201/500000] + train/ActionL1Loss=0.0533 + throughput/total_tokens=2,342,592,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12202/500000] + train/ActionL1Loss=0.0255 + throughput/total_tokens=2,342,784,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12203/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=2,342,976,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12204/500000] + train/ActionL1Loss=0.0441 + throughput/total_tokens=2,343,168,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12205/500000] + train/ActionL1Loss=0.0395 + throughput/total_tokens=2,343,360,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12206/500000] + train/ActionL1Loss=0.0292 + throughput/total_tokens=2,343,552,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12207/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=2,343,744,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12208/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=2,343,936,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12209/500000] + train/ActionL1Loss=0.0417 + throughput/total_tokens=2,344,128,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=12210/500000] + train/ActionL1Loss=0.0400 + throughput/total_tokens=2,344,320,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12211/500000] + train/ActionL1Loss=0.0524 + throughput/total_tokens=2,344,512,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12212/500000] + train/ActionL1Loss=0.0264 + throughput/total_tokens=2,344,704,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12213/500000] + train/ActionL1Loss=0.0486 + throughput/total_tokens=2,344,896,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12214/500000] + train/ActionL1Loss=0.0512 + throughput/total_tokens=2,345,088,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12215/500000] + train/ActionL1Loss=0.0518 + throughput/total_tokens=2,345,280,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12216/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,345,472,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12217/500000] + train/ActionL1Loss=0.0436 + throughput/total_tokens=2,345,664,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12218/500000] + train/ActionL1Loss=0.0424 + throughput/total_tokens=2,345,856,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12219/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=2,346,048,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12220/500000] + optim/total_grad_norm=9.750 + train/ActionL1Loss=0.0410 + throughput/total_tokens=2,346,240,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12221/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=2,346,432,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12222/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,346,624,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12223/500000] + train/ActionL1Loss=0.0475 + throughput/total_tokens=2,346,816,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12224/500000] + train/ActionL1Loss=0.0309 + throughput/total_tokens=2,347,008,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12225/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=2,347,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12226/500000] + train/ActionL1Loss=0.0371 + throughput/total_tokens=2,347,392,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12227/500000] + train/ActionL1Loss=0.0368 + throughput/total_tokens=2,347,584,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12228/500000] + train/ActionL1Loss=0.0363 + throughput/total_tokens=2,347,776,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12229/500000] + train/ActionL1Loss=0.0488 + throughput/total_tokens=2,347,968,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12230/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=2,348,160,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=12231/500000] + train/ActionL1Loss=0.0430 + throughput/total_tokens=2,348,352,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12232/500000] + train/ActionL1Loss=0.0483 + throughput/total_tokens=2,348,544,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12233/500000] + train/ActionL1Loss=0.0359 + throughput/total_tokens=2,348,736,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12234/500000] + train/ActionL1Loss=0.0228 + throughput/total_tokens=2,348,928,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12235/500000] + train/ActionL1Loss=0.0314 + throughput/total_tokens=2,349,120,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12236/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,349,312,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12237/500000] + train/ActionL1Loss=0.0428 + throughput/total_tokens=2,349,504,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12238/500000] + train/ActionL1Loss=0.0582 + throughput/total_tokens=2,349,696,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12239/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,349,888,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12240/500000] + optim/total_grad_norm=9.185 + train/ActionL1Loss=0.0429 + throughput/total_tokens=2,350,080,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12241/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,350,272,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12242/500000] + train/ActionL1Loss=0.0537 + throughput/total_tokens=2,350,464,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12243/500000] + train/ActionL1Loss=0.0290 + throughput/total_tokens=2,350,656,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12244/500000] + train/ActionL1Loss=0.0389 + throughput/total_tokens=2,350,848,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12245/500000] + train/ActionL1Loss=0.0435 + throughput/total_tokens=2,351,040,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12246/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,351,232,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12247/500000] + train/ActionL1Loss=0.0422 + throughput/total_tokens=2,351,424,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12248/500000] + train/ActionL1Loss=0.0498 + throughput/total_tokens=2,351,616,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12249/500000] + train/ActionL1Loss=0.0369 + throughput/total_tokens=2,351,808,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12250/500000] + train/ActionL1Loss=0.0330 + throughput/total_tokens=2,352,000,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12251/500000] + train/ActionL1Loss=0.0350 + throughput/total_tokens=2,352,192,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=12252/500000] + train/ActionL1Loss=0.0361 + throughput/total_tokens=2,352,384,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 +[step=12253/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=2,352,576,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12254/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=2,352,768,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12255/500000] + train/ActionL1Loss=0.0489 + throughput/total_tokens=2,352,960,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12256/500000] + train/ActionL1Loss=0.0269 + throughput/total_tokens=2,353,152,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12257/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,353,344,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12258/500000] + train/ActionL1Loss=0.0277 + throughput/total_tokens=2,353,536,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12259/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=2,353,728,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12260/500000] + optim/total_grad_norm=8.395 + train/ActionL1Loss=0.0424 + throughput/total_tokens=2,353,920,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12261/500000] + train/ActionL1Loss=0.0490 + throughput/total_tokens=2,354,112,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12262/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,354,304,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12263/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=2,354,496,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12264/500000] + train/ActionL1Loss=0.0403 + throughput/total_tokens=2,354,688,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12265/500000] + train/ActionL1Loss=0.0484 + throughput/total_tokens=2,354,880,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12266/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,355,072,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12267/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,355,264,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12268/500000] + train/ActionL1Loss=0.0579 + throughput/total_tokens=2,355,456,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12269/500000] + train/ActionL1Loss=0.0499 + throughput/total_tokens=2,355,648,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12270/500000] + train/ActionL1Loss=0.0406 + throughput/total_tokens=2,355,840,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12271/500000] + train/ActionL1Loss=0.0674 + throughput/total_tokens=2,356,032,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12272/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,356,224,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12273/500000] + train/ActionL1Loss=0.0399 + throughput/total_tokens=2,356,416,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12274/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,356,608,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12275/500000] + train/ActionL1Loss=0.0615 + throughput/total_tokens=2,356,800,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12276/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,356,992,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12277/500000] + train/ActionL1Loss=0.0327 + throughput/total_tokens=2,357,184,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12278/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,357,376,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12279/500000] + train/ActionL1Loss=0.0388 + throughput/total_tokens=2,357,568,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12280/500000] + optim/total_grad_norm=8.763 + train/ActionL1Loss=0.0312 + throughput/total_tokens=2,357,760,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=12281/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,357,952,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12282/500000] + train/ActionL1Loss=0.0316 + throughput/total_tokens=2,358,144,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12283/500000] + train/ActionL1Loss=0.0577 + throughput/total_tokens=2,358,336,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12284/500000] + train/ActionL1Loss=0.0516 + throughput/total_tokens=2,358,528,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12285/500000] + train/ActionL1Loss=0.0453 + throughput/total_tokens=2,358,720,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12286/500000] + train/ActionL1Loss=0.0521 + throughput/total_tokens=2,358,912,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12287/500000] + train/ActionL1Loss=0.0543 + throughput/total_tokens=2,359,104,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12288/500000] + train/ActionL1Loss=0.0337 + throughput/total_tokens=2,359,296,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12289/500000] + train/ActionL1Loss=0.0517 + throughput/total_tokens=2,359,488,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12290/500000] + train/ActionL1Loss=0.0339 + throughput/total_tokens=2,359,680,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=12291/500000] + train/ActionL1Loss=0.0378 + throughput/total_tokens=2,359,872,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12292/500000] + train/ActionL1Loss=0.0320 + throughput/total_tokens=2,360,064,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 +[step=12293/500000] + train/ActionL1Loss=0.0496 + throughput/total_tokens=2,360,256,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12294/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,360,448,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12295/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=2,360,640,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0492 +[step=12296/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,360,832,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12297/500000] + train/ActionL1Loss=0.0500 + throughput/total_tokens=2,361,024,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12298/500000] + train/ActionL1Loss=0.0466 + throughput/total_tokens=2,361,216,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12299/500000] + train/ActionL1Loss=0.0394 + throughput/total_tokens=2,361,408,000 + throughput/device/tokens_per_second=1,180 + throughput/device/batches_per_second=0.0492 +[step=12300/500000] + optim/total_grad_norm=9.073 + train/ActionL1Loss=0.0482 + throughput/total_tokens=2,361,600,000 + throughput/device/tokens_per_second=1,181 + throughput/device/batches_per_second=0.0492 + System/Peak GPU Memory (MB)=46,924 +[step=12301/500000] + train/ActionL1Loss=0.0569 + throughput/total_tokens=2,361,792,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12302/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,361,984,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12303/500000] + train/ActionL1Loss=0.0335 + throughput/total_tokens=2,362,176,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12304/500000] + train/ActionL1Loss=0.0420 + throughput/total_tokens=2,362,368,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12305/500000] + train/ActionL1Loss=0.0591 + throughput/total_tokens=2,362,560,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12306/500000] + train/ActionL1Loss=0.0508 + throughput/total_tokens=2,362,752,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12307/500000] + train/ActionL1Loss=0.0456 + throughput/total_tokens=2,362,944,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12308/500000] + train/ActionL1Loss=0.0416 + throughput/total_tokens=2,363,136,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12309/500000] + train/ActionL1Loss=0.0414 + throughput/total_tokens=2,363,328,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12310/500000] + train/ActionL1Loss=0.0262 + throughput/total_tokens=2,363,520,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12311/500000] + train/ActionL1Loss=0.0432 + throughput/total_tokens=2,363,712,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12312/500000] + train/ActionL1Loss=0.0520 + throughput/total_tokens=2,363,904,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12313/500000] + train/ActionL1Loss=0.0387 + throughput/total_tokens=2,364,096,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12314/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,364,288,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12315/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,364,480,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12316/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=2,364,672,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12317/500000] + train/ActionL1Loss=0.0397 + throughput/total_tokens=2,364,864,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0489 +[step=12318/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=2,365,056,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12319/500000] + train/ActionL1Loss=0.0396 + throughput/total_tokens=2,365,248,000 + throughput/device/tokens_per_second=1,173 + throughput/device/batches_per_second=0.0489 +[step=12320/500000] + optim/total_grad_norm=7.616 + train/ActionL1Loss=0.0395 + throughput/total_tokens=2,365,440,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12321/500000] + train/ActionL1Loss=0.0375 + throughput/total_tokens=2,365,632,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12322/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=2,365,824,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12323/500000] + train/ActionL1Loss=0.0306 + throughput/total_tokens=2,366,016,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12324/500000] + train/ActionL1Loss=0.0463 + throughput/total_tokens=2,366,208,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12325/500000] + train/ActionL1Loss=0.0398 + throughput/total_tokens=2,366,400,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12326/500000] + train/ActionL1Loss=0.0315 + throughput/total_tokens=2,366,592,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12327/500000] + train/ActionL1Loss=0.0355 + throughput/total_tokens=2,366,784,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12328/500000] + train/ActionL1Loss=0.0457 + throughput/total_tokens=2,366,976,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12329/500000] + train/ActionL1Loss=0.0299 + throughput/total_tokens=2,367,168,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12330/500000] + train/ActionL1Loss=0.0216 + throughput/total_tokens=2,367,360,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12331/500000] + train/ActionL1Loss=0.0467 + throughput/total_tokens=2,367,552,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12332/500000] + train/ActionL1Loss=0.0413 + throughput/total_tokens=2,367,744,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12333/500000] + train/ActionL1Loss=0.0390 + throughput/total_tokens=2,367,936,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12334/500000] + train/ActionL1Loss=0.0461 + throughput/total_tokens=2,368,128,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12335/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=2,368,320,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12336/500000] + train/ActionL1Loss=0.0434 + throughput/total_tokens=2,368,512,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12337/500000] + train/ActionL1Loss=0.0370 + throughput/total_tokens=2,368,704,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0490 +[step=12338/500000] + train/ActionL1Loss=0.0197 + throughput/total_tokens=2,368,896,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12339/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,369,088,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12340/500000] + optim/total_grad_norm=8.639 + train/ActionL1Loss=0.0502 + throughput/total_tokens=2,369,280,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12341/500000] + train/ActionL1Loss=0.0393 + throughput/total_tokens=2,369,472,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12342/500000] + train/ActionL1Loss=0.0265 + throughput/total_tokens=2,369,664,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12343/500000] + train/ActionL1Loss=0.0440 + throughput/total_tokens=2,369,856,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12344/500000] + train/ActionL1Loss=0.0327 + throughput/total_tokens=2,370,048,000 + throughput/device/tokens_per_second=1,177 + throughput/device/batches_per_second=0.0491 +[step=12345/500000] + train/ActionL1Loss=0.0515 + throughput/total_tokens=2,370,240,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12346/500000] + train/ActionL1Loss=0.0348 + throughput/total_tokens=2,370,432,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12347/500000] + train/ActionL1Loss=0.0299 + throughput/total_tokens=2,370,624,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12348/500000] + train/ActionL1Loss=0.0418 + throughput/total_tokens=2,370,816,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12349/500000] + train/ActionL1Loss=0.0492 + throughput/total_tokens=2,371,008,000 + throughput/device/tokens_per_second=1,178 + throughput/device/batches_per_second=0.0491 +[step=12350/500000] + train/ActionL1Loss=0.0529 + throughput/total_tokens=2,371,200,000 + throughput/device/tokens_per_second=1,179 + throughput/device/batches_per_second=0.0491 + System/Peak GPU Memory (MB)=46,924 +[step=12351/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=2,371,392,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12352/500000] + train/ActionL1Loss=0.0523 + throughput/total_tokens=2,371,584,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12353/500000] + train/ActionL1Loss=0.0439 + throughput/total_tokens=2,371,776,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12354/500000] + train/ActionL1Loss=0.0362 + throughput/total_tokens=2,371,968,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12355/500000] + train/ActionL1Loss=0.0341 + throughput/total_tokens=2,372,160,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12356/500000] + train/ActionL1Loss=0.0408 + throughput/total_tokens=2,372,352,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12357/500000] + train/ActionL1Loss=0.0507 + throughput/total_tokens=2,372,544,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12358/500000] + train/ActionL1Loss=0.0280 + throughput/total_tokens=2,372,736,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12359/500000] + train/ActionL1Loss=0.0561 + throughput/total_tokens=2,372,928,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12360/500000] + optim/total_grad_norm=8.605 + train/ActionL1Loss=0.0382 + throughput/total_tokens=2,373,120,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 + System/Peak GPU Memory (MB)=46,924 +[step=12361/500000] + train/ActionL1Loss=0.0510 + throughput/total_tokens=2,373,312,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12362/500000] + train/ActionL1Loss=0.0326 + throughput/total_tokens=2,373,504,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12363/500000] + train/ActionL1Loss=0.0459 + throughput/total_tokens=2,373,696,000 + throughput/device/tokens_per_second=1,176 + throughput/device/batches_per_second=0.0490 +[step=12364/500000] + train/ActionL1Loss=0.0454 + throughput/total_tokens=2,373,888,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12365/500000] + train/ActionL1Loss=0.0548 + throughput/total_tokens=2,374,080,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12366/500000] + train/ActionL1Loss=0.0526 + throughput/total_tokens=2,374,272,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12367/500000] + train/ActionL1Loss=0.0415 + throughput/total_tokens=2,374,464,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12368/500000] + train/ActionL1Loss=0.0535 + throughput/total_tokens=2,374,656,000 + throughput/device/tokens_per_second=1,175 + throughput/device/batches_per_second=0.0490 +[step=12369/500000] + train/ActionL1Loss=0.0444 + throughput/total_tokens=2,374,848,000 + throughput/device/tokens_per_second=1,174 + throughput/device/batches_per_second=0.0490 diff --git a/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/logs/debug-core.log b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/logs/debug-core.log new file mode 100644 index 0000000000000000000000000000000000000000..d7c22af20496037043449115975532679faf5cfc --- /dev/null +++ b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/logs/debug-core.log @@ -0,0 +1,6 @@ +{"time":"2025-10-11T16:38:45.197330387Z","level":"INFO","msg":"main: starting server","port-filename":"/tmp/tmpygij4s57/port-579278.txt","pid":579278,"log-level":0,"disable-analytics":false,"shutdown-on-parent-exit":false,"enable-dcgm-profiling":false} +{"time":"2025-10-11T16:38:45.198122306Z","level":"INFO","msg":"server: will exit if parent process dies","ppid":579278} +{"time":"2025-10-11T16:38:45.199702094Z","level":"INFO","msg":"server: accepting connections","addr":{"Name":"/tmp/wandb-579278-579454-1269370264/socket","Net":"unix"}} +{"time":"2025-10-11T16:38:45.353337002Z","level":"INFO","msg":"connection: ManageConnectionData: new connection created","id":"1(@)"} +{"time":"2025-10-11T16:38:45.368049369Z","level":"INFO","msg":"handleInformInit: received","streamId":"qzez8pv7","id":"1(@)"} +{"time":"2025-10-11T16:38:46.624632949Z","level":"INFO","msg":"handleInformInit: stream started","streamId":"qzez8pv7","id":"1(@)"} diff --git a/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/logs/debug-internal.log b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/logs/debug-internal.log new file mode 100644 index 0000000000000000000000000000000000000000..386717a53f873d08b6a50146f5882cde5ce853d2 --- /dev/null +++ b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/logs/debug-internal.log @@ -0,0 +1,12 @@ +{"time":"2025-10-11T16:38:45.369810639Z","level":"INFO","msg":"stream: starting","core version":"0.21.4"} +{"time":"2025-10-11T16:38:46.624568558Z","level":"INFO","msg":"stream: created new stream","id":"qzez8pv7"} +{"time":"2025-10-11T16:38:46.624626598Z","level":"INFO","msg":"stream: started","id":"qzez8pv7"} +{"time":"2025-10-11T16:38:46.624662329Z","level":"INFO","msg":"sender: started","stream_id":"qzez8pv7"} +{"time":"2025-10-11T16:38:46.624681929Z","level":"INFO","msg":"handler: started","stream_id":"qzez8pv7"} +{"time":"2025-10-11T16:38:46.624653129Z","level":"INFO","msg":"writer: started","stream_id":"qzez8pv7"} +{"time":"2025-10-11T20:03:56.095706913Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-13T02:33:28.920574862Z","level":"INFO","msg":"api: retrying HTTP error","status":502,"url":"https://api.wandb.ai/files/henryeap/a1-realworld/qzez8pv7/file_stream","body":"\n\n\n502 Server Error\n\n\n

Error: Server Error

\n

The server encountered a temporary error and could not complete your request.

Please try again in 30 seconds.

\n

\n\n"} +{"time":"2025-10-13T16:23:56.963675478Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-13T20:04:02.844107426Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-13T22:38:31.203849115Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": context deadline exceeded (Client.Timeout exceeded while awaiting headers)"} +{"time":"2025-10-14T15:32:47.24166171Z","level":"INFO","msg":"api: retrying error","error":"Post \"https://api.wandb.ai/graphql\": net/http: request canceled (Client.Timeout exceeded while awaiting headers)"} diff --git a/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/logs/debug.log b/eraser_l1_regression/wandb/wandb/run-20251011_163844-qzez8pv7/logs/debug.log new file mode 100644 index 0000000000000000000000000000000000000000..e69de29bb2d1d6434b8b29ae775ad8c2e48c5391 diff --git a/glue_flow_matching/step11500-action-head/metadata.pt b/glue_flow_matching/step11500-action-head/metadata.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e34304d65d6217c2b0a33ee0a75ccecc5e8f82c --- /dev/null +++ b/glue_flow_matching/step11500-action-head/metadata.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb72b6306ce04d1beb20bb289509f00c39a40845ff7c4b36bf4deb4e83fe82a +size 1331 diff --git a/glue_flow_matching/step12000-action-head/metadata.pt b/glue_flow_matching/step12000-action-head/metadata.pt new file mode 100644 index 0000000000000000000000000000000000000000..752c8b547c4cac7f78746ac5066032167b1cf3c1 --- /dev/null +++ b/glue_flow_matching/step12000-action-head/metadata.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:995307502120af3866f237cd0bc484fc848a652539d28e53cbea882abc16ba6b +size 1331 diff --git a/glue_flow_matching/step12000-unsharded/lora.pt b/glue_flow_matching/step12000-unsharded/lora.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3eb8fc48e155d8229340760896a20ba9fc413e2 --- /dev/null +++ b/glue_flow_matching/step12000-unsharded/lora.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b09055f15a54dd092b4dd30833406731057005822da0c55c16231cf2e68f7f6 +size 1243 diff --git a/glue_flow_matching/step12000-unsharded/train.pt b/glue_flow_matching/step12000-unsharded/train.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e6823c52299a33b82c93e46b47d60826516a853 --- /dev/null +++ b/glue_flow_matching/step12000-unsharded/train.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7925040e6d261a8079db04992b9e7db6ca5303a21d88a9140e264004450bace7 +size 15061 diff --git a/glue_l1_regression/step11500-action-head/metadata.pt b/glue_l1_regression/step11500-action-head/metadata.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcf35cc50d811be8391b077330fc58f140a6565a --- /dev/null +++ b/glue_l1_regression/step11500-action-head/metadata.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f3468869fca8c228cf940661de292bc786f2b18fa96d39a892606183f8dd9c0 +size 1331 diff --git a/glue_l1_regression/step12000-action-head/metadata.pt b/glue_l1_regression/step12000-action-head/metadata.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd2f224af58612b62d81033fb0bfb23b0ab41a53 --- /dev/null +++ b/glue_l1_regression/step12000-action-head/metadata.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620f952d81c645b6e811733acfcda83cb57d683353c484746edb322f5094c21e +size 1331 diff --git a/glue_l1_regression/step12000-unsharded/lora.pt b/glue_l1_regression/step12000-unsharded/lora.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3eb8fc48e155d8229340760896a20ba9fc413e2 --- /dev/null +++ b/glue_l1_regression/step12000-unsharded/lora.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b09055f15a54dd092b4dd30833406731057005822da0c55c16231cf2e68f7f6 +size 1243 diff --git a/glue_l1_regression/step12000-unsharded/train.pt b/glue_l1_regression/step12000-unsharded/train.pt new file mode 100644 index 0000000000000000000000000000000000000000..a75a8cfd72d2397fc68c4204e10d750e25168d39 --- /dev/null +++ b/glue_l1_regression/step12000-unsharded/train.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0add07bb7303cce1575bd55655e1100f3ad78768d913c98e0008fec041c506f +size 15061 diff --git a/pen_flow_matching/step12000-unsharded/train.pt b/pen_flow_matching/step12000-unsharded/train.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bce1f695d46d3c80745259b348850d69aa57147 --- /dev/null +++ b/pen_flow_matching/step12000-unsharded/train.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5dc3049b151b366f3fbb7cceb103c236af549d6d88c1ce9e97284f067a36ad4b +size 15061 diff --git a/wandb/wandb/run-20251002_150921-kqbx0cjv/run-kqbx0cjv.wandb b/wandb/wandb/run-20251002_150921-kqbx0cjv/run-kqbx0cjv.wandb new file mode 100644 index 0000000000000000000000000000000000000000..e677f99b36a0ea9d181ee618b4b38ba761e0cba5 --- /dev/null +++ b/wandb/wandb/run-20251002_150921-kqbx0cjv/run-kqbx0cjv.wandb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeec1dd1d51418ce6f5612a68cab147386b6073e65014f124ae04fb4d527e4e5 +size 2031616 diff --git a/wandb/wandb/run-20251002_151047-gal9lnsm/run-gal9lnsm.wandb b/wandb/wandb/run-20251002_151047-gal9lnsm/run-gal9lnsm.wandb new file mode 100644 index 0000000000000000000000000000000000000000..9258bdbe98dfb03c4216a7f297389c7e1a68ec89 --- /dev/null +++ b/wandb/wandb/run-20251002_151047-gal9lnsm/run-gal9lnsm.wandb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:559eaaa6a467f7a1e33623030b03745684f069bb32c1a69077166d8d1c8f0b06 +size 1441792 diff --git a/wandb/wandb/run-20251002_155441-70dhy5dq/run-70dhy5dq.wandb b/wandb/wandb/run-20251002_155441-70dhy5dq/run-70dhy5dq.wandb new file mode 100644 index 0000000000000000000000000000000000000000..c3d6c22d1d26f164aff150cde7c7c3e7580cab8f --- /dev/null +++ b/wandb/wandb/run-20251002_155441-70dhy5dq/run-70dhy5dq.wandb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:552a1481b0900b10948b3e1155bbc44b1bb40df456569b2985a9c6e7dc7058ff +size 1376256 diff --git a/wipe_l1_regression/wandb/wandb/run-20251005_163743-a1znetn8/run-a1znetn8.wandb b/wipe_l1_regression/wandb/wandb/run-20251005_163743-a1znetn8/run-a1znetn8.wandb new file mode 100644 index 0000000000000000000000000000000000000000..b5e19786c31d3f6f87b81e7d730a6ad461f3e744 --- /dev/null +++ b/wipe_l1_regression/wandb/wandb/run-20251005_163743-a1znetn8/run-a1znetn8.wandb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8189b4c2131ae4163525b4d10f793c57a4fd8daecc42141cc76acd79b7248dcc +size 412090368